Repository: PBSPro/pbspro Branch: master Commit: cd7ab5edaf03 Files: 1196 Total size: 17.5 MB Directory structure: gitextract_2t7z1zdf/ ├── .clang-format ├── .github/ │ ├── PULL_REQUEST_TEMPLATE.md │ ├── checkclang │ ├── checkpep8 │ └── runchecks ├── .gitignore ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── COPYRIGHT ├── INSTALL ├── LICENSE ├── Makefile.am ├── PBS_License.txt ├── README.md ├── autogen.sh ├── azure-pipelines.yml ├── buildutils/ │ ├── Makefile.am │ └── attr_parser.py ├── ci/ │ ├── README.md │ ├── ci │ └── etc/ │ ├── build-pbs-packages.sh │ ├── ci-script-wrapper.service │ ├── configure_node.sh │ ├── container-env-setup.sh │ ├── container-init │ ├── do.sh │ ├── do_sanitize_mode.sh │ ├── docker-entrypoint │ ├── gen_ptl_json.sh │ ├── id_rsa │ ├── id_rsa.pub │ ├── install-system-packages │ ├── killit.sh │ ├── macros │ └── sudoers-overrides ├── configure.ac ├── doc/ │ ├── Makefile.am │ ├── man1/ │ │ ├── pbs_hook_attributes.7B │ │ ├── pbs_job_attributes.7B │ │ ├── pbs_login.1B │ │ ├── pbs_module.7B │ │ ├── pbs_node_attributes.7B │ │ ├── pbs_professional.7B │ │ ├── pbs_python.1B │ │ ├── pbs_queue_attributes.7B │ │ ├── pbs_ralter.1B │ │ ├── pbs_rdel.1B │ │ ├── pbs_release_nodes.1B │ │ ├── pbs_resources.7B │ │ ├── pbs_resv_attributes.7B │ │ ├── pbs_rstat.1B │ │ ├── pbs_rsub.1B │ │ ├── pbs_sched_attributes.7B │ │ ├── pbs_server_attributes.7B │ │ ├── pbsdsh.1B │ │ ├── qalter.1B │ │ ├── qdel.1B │ │ ├── qhold.1B │ │ ├── qmove.1B │ │ ├── qmsg.1B │ │ ├── qorder.1B │ │ ├── qrerun.1B │ │ ├── qrls.1B │ │ ├── qselect.1B │ │ ├── qsig.1B │ │ ├── qstat.1B │ │ └── qsub.1B │ ├── man3/ │ │ ├── pbs_alterjob.3B │ │ ├── pbs_asyrunjob.3B │ │ ├── pbs_confirmresv.3B │ │ ├── pbs_connect.3B │ │ ├── pbs_default.3B │ │ ├── pbs_deljob.3B │ │ ├── pbs_delresv.3B │ │ ├── pbs_disconnect.3B │ │ ├── pbs_geterrmsg.3B │ │ ├── pbs_holdjob.3B │ │ ├── pbs_locjob.3B │ │ ├── pbs_manager.3B │ │ ├── pbs_modify_resv.3B │ │ ├── pbs_movejob.3B │ │ ├── pbs_msgjob.3B │ │ ├── pbs_orderjob.3B │ │ ├── 
pbs_preempt_jobs.3B │ │ ├── pbs_relnodesjob.3B │ │ ├── pbs_rerunjob.3B │ │ ├── pbs_rescquery.3B │ │ ├── pbs_rescreserve.3B │ │ ├── pbs_rlsjob.3B │ │ ├── pbs_runjob.3B │ │ ├── pbs_selectjob.3B │ │ ├── pbs_selstat.3B │ │ ├── pbs_sigjob.3B │ │ ├── pbs_stagein.3B │ │ ├── pbs_statfree.3B │ │ ├── pbs_stathook.3B │ │ ├── pbs_stathost.3B │ │ ├── pbs_statjob.3B │ │ ├── pbs_statnode.3B │ │ ├── pbs_statque.3B │ │ ├── pbs_statresv.3B │ │ ├── pbs_statrsc.3B │ │ ├── pbs_statsched.3B │ │ ├── pbs_statserver.3B │ │ ├── pbs_statvnode.3B │ │ ├── pbs_submit.3B │ │ ├── pbs_submit_resv.3B │ │ ├── pbs_submitresv.3B │ │ ├── pbs_tclapi.3B │ │ ├── pbs_terminate.3B │ │ ├── rm.3B │ │ └── tm.3 │ └── man8/ │ ├── mpiexec.8B │ ├── pbs.8B │ ├── pbs.conf.8B │ ├── pbs_account.8B │ ├── pbs_attach.8B │ ├── pbs_comm.8B │ ├── pbs_dataservice.8B │ ├── pbs_ds_password.8B │ ├── pbs_hostn.8B │ ├── pbs_idled.8B │ ├── pbs_iff.8B │ ├── pbs_interactive.8B │ ├── pbs_lamboot.8B │ ├── pbs_mkdirs.8B │ ├── pbs_mom.8B │ ├── pbs_mpihp.8B │ ├── pbs_mpilam.8B │ ├── pbs_mpirun.8B │ ├── pbs_probe.8B │ ├── pbs_sched.8B │ ├── pbs_server.8B │ ├── pbs_snapshot.8B │ ├── pbs_tclsh.8B │ ├── pbs_tmrsh.8B │ ├── pbs_topologyinfo.8B │ ├── pbs_wish.8B │ ├── pbsfs.8B │ ├── pbsnodes.8B │ ├── pbsrun.8B │ ├── pbsrun_unwrap.8B │ ├── pbsrun_wrap.8B │ ├── printjob.8B │ ├── qdisable.8B │ ├── qenable.8B │ ├── qmgr.8B │ ├── qrun.8B │ ├── qstart.8B │ ├── qstop.8B │ ├── qterm.8B │ ├── tracejob.8B │ └── win_postinstall.py.8B ├── m4/ │ ├── disable_shell_pipe.m4 │ ├── disable_syslog.m4 │ ├── enable_alps.m4 │ ├── enable_ptl.m4 │ ├── pbs_decl_epoll.m4 │ ├── pbs_decl_epoll_pwait.m4 │ ├── pbs_decl_h_errno.m4 │ ├── pbs_decl_ppoll.m4 │ ├── pbs_decl_socklen_t.m4 │ ├── pbs_patch_libtool.m4 │ ├── pbs_systemd_unitdir.m4 │ ├── pbs_version.m4 │ ├── security_check.m4 │ ├── with_cjson.m4 │ ├── with_core_limit.m4 │ ├── with_database_dir.m4 │ ├── with_database_port.m4 │ ├── with_database_user.m4 │ ├── with_editline.m4 │ ├── with_expat.m4 │ ├── with_hwloc.m4 │ ├── 
with_krbauth.m4 │ ├── with_libical.m4 │ ├── with_libz.m4 │ ├── with_min_stack_limit.m4 │ ├── with_pbs_conf_file.m4 │ ├── with_pmix.m4 │ ├── with_python.m4 │ ├── with_sendmail.m4 │ ├── with_server_home.m4 │ ├── with_server_name_file.m4 │ ├── with_swig.m4 │ ├── with_tcl.m4 │ ├── with_tclatrsep.m4 │ ├── with_tmpdir.m4 │ ├── with_unsupported_dir.m4 │ └── with_xauth.m4 ├── openpbs-rpmlintrc ├── openpbs.spec.in ├── src/ │ ├── Makefile.am │ ├── cmds/ │ │ ├── Makefile.am │ │ ├── mpiexec.in │ │ ├── pbs_attach.c │ │ ├── pbs_attach_sup.c │ │ ├── pbs_dataservice.c │ │ ├── pbs_demux.c │ │ ├── pbs_ds_password.c │ │ ├── pbs_lamboot.in │ │ ├── pbs_mpihp.in │ │ ├── pbs_mpilam.in │ │ ├── pbs_mpirun.in │ │ ├── pbs_ralter.c │ │ ├── pbs_rdel.c │ │ ├── pbs_release_nodes.c │ │ ├── pbs_remsh.in │ │ ├── pbs_rstat.c │ │ ├── pbs_rsub.c │ │ ├── pbs_tmrsh.c │ │ ├── pbsdsh.c │ │ ├── pbsnodes.c │ │ ├── pbsrun.in │ │ ├── pbsrun_unwrap.in │ │ ├── pbsrun_wrap.in │ │ ├── qalter.c │ │ ├── qdel.c │ │ ├── qdisable.c │ │ ├── qenable.c │ │ ├── qhold.c │ │ ├── qmgr.c │ │ ├── qmgr_sup.c │ │ ├── qmove.c │ │ ├── qmsg.c │ │ ├── qorder.c │ │ ├── qrerun.c │ │ ├── qrls.c │ │ ├── qrun.c │ │ ├── qselect.c │ │ ├── qsig.c │ │ ├── qstart.c │ │ ├── qstat.c │ │ ├── qstop.c │ │ ├── qsub.c │ │ ├── qsub_sup.c │ │ ├── qterm.c │ │ ├── sample.qstatrc │ │ └── scripts/ │ │ ├── Makefile.am │ │ ├── limits.pbs_mom.compat │ │ ├── limits.post_services.compat │ │ ├── modulefile.in │ │ ├── pbs.csh │ │ ├── pbs.service.in │ │ ├── pbs.sh │ │ ├── pbs_bootcheck.py │ │ ├── pbs_dataservice │ │ ├── pbs_ds_password │ │ ├── pbs_habitat.in │ │ ├── pbs_init.d.in │ │ ├── pbs_poerun.in │ │ ├── pbs_postinstall.in │ │ ├── pbs_posttrans │ │ ├── pbs_preuninstall │ │ ├── pbs_reload.in │ │ ├── pbs_server │ │ ├── pbs_snapshot │ │ ├── pbs_topologyinfo │ │ ├── pbs_topologyinfo.py │ │ ├── pbsrun.ch_gm.init.in │ │ ├── pbsrun.ch_mx.init.in │ │ ├── pbsrun.gm_mpd.init.in │ │ ├── pbsrun.intelmpi.init.in │ │ ├── pbsrun.mpich2.init.in │ │ ├── 
pbsrun.mvapich1.init.in │ │ ├── pbsrun.mvapich2.init.in │ │ ├── pbsrun.mx_mpd.init.in │ │ ├── pbsrun.poe.in │ │ ├── pbsrun.poe.init.in │ │ ├── printjob │ │ └── sgiMPI.awk │ ├── hooks/ │ │ ├── Makefile.am │ │ └── cgroups/ │ │ ├── pbs_cgroups.CF │ │ ├── pbs_cgroups.HK │ │ └── pbs_cgroups.PY │ ├── iff/ │ │ ├── Makefile.am │ │ └── iff2.c │ ├── include/ │ │ ├── Long.h │ │ ├── Long_.h │ │ ├── Makefile.am │ │ ├── acct.h │ │ ├── attribute.h │ │ ├── auth.h │ │ ├── avltree.h │ │ ├── basil.h │ │ ├── batch_request.h │ │ ├── bitfield.h │ │ ├── cmds.h │ │ ├── credential.h │ │ ├── dedup_jobids.h │ │ ├── dis.h │ │ ├── grunt.h │ │ ├── hook.h │ │ ├── hook_func.h │ │ ├── ifl_internal.h │ │ ├── job.h │ │ ├── libauth.h │ │ ├── libpbs.h │ │ ├── libsec.h │ │ ├── libutil.h │ │ ├── list_link.h │ │ ├── log.h │ │ ├── mom_func.h │ │ ├── mom_hook_func.h │ │ ├── mom_server.h │ │ ├── mom_vnode.h │ │ ├── net_connect.h │ │ ├── pbs_array_list.h │ │ ├── pbs_assert.h │ │ ├── pbs_client_thread.h │ │ ├── pbs_db.h │ │ ├── pbs_ecl.h │ │ ├── pbs_entlim.h │ │ ├── pbs_error.h │ │ ├── pbs_idx.h │ │ ├── pbs_ifl.h │ │ ├── pbs_internal.h │ │ ├── pbs_json.h │ │ ├── pbs_license.h │ │ ├── pbs_mpp.h │ │ ├── pbs_nodes.h │ │ ├── pbs_python.h │ │ ├── pbs_python_private.h │ │ ├── pbs_reliable.h │ │ ├── pbs_sched.h │ │ ├── pbs_share.h │ │ ├── pbs_v1_module_common.i │ │ ├── pbs_version.h.in │ │ ├── placementsets.h │ │ ├── port_forwarding.h │ │ ├── portability.h │ │ ├── provision.h │ │ ├── qmgr.h │ │ ├── queue.h │ │ ├── range.h │ │ ├── reservation.h │ │ ├── resmon.h │ │ ├── resource.h │ │ ├── resv_node.h │ │ ├── rm.h │ │ ├── sched_cmds.h │ │ ├── server.h │ │ ├── server_limits.h │ │ ├── site_job_attr_def.h │ │ ├── site_job_attr_enum.h │ │ ├── site_qmgr_node_print.h │ │ ├── site_qmgr_que_print.h │ │ ├── site_qmgr_sched_print.h │ │ ├── site_qmgr_svr_print.h │ │ ├── site_que_attr_def.h │ │ ├── site_que_attr_enum.h │ │ ├── site_queue.h │ │ ├── site_resc_attr_def.h │ │ ├── site_resv_attr_def.h │ │ ├── site_resv_attr_enum.h │ │ 
├── site_sched_attr_def.h │ │ ├── site_sched_attr_enum.h │ │ ├── site_svr_attr_def.h │ │ ├── site_svr_attr_enum.h │ │ ├── svrfunc.h │ │ ├── ticket.h │ │ ├── tm.h │ │ ├── tm_.h │ │ ├── tpp.h │ │ ├── tracking.h │ │ ├── user.h │ │ └── work_task.h │ ├── lib/ │ │ ├── Libattr/ │ │ │ ├── Long_.c │ │ │ ├── Makefile.am │ │ │ ├── attr_atomic.c │ │ │ ├── attr_fn_acl.c │ │ │ ├── attr_fn_arst.c │ │ │ ├── attr_fn_b.c │ │ │ ├── attr_fn_c.c │ │ │ ├── attr_fn_entlim.c │ │ │ ├── attr_fn_f.c │ │ │ ├── attr_fn_hold.c │ │ │ ├── attr_fn_intr.c │ │ │ ├── attr_fn_l.c │ │ │ ├── attr_fn_ll.c │ │ │ ├── attr_fn_resc.c │ │ │ ├── attr_fn_size.c │ │ │ ├── attr_fn_str.c │ │ │ ├── attr_fn_time.c │ │ │ ├── attr_fn_unkn.c │ │ │ ├── attr_func.c │ │ │ ├── attr_node_func.c │ │ │ ├── attr_resc_func.c │ │ │ ├── master_job_attr_def.xml │ │ │ ├── master_node_attr_def.xml │ │ │ ├── master_queue_attr_def.xml │ │ │ ├── master_resc_def_all.xml │ │ │ ├── master_resv_attr_def.xml │ │ │ ├── master_sched_attr_def.xml │ │ │ ├── master_svr_attr_def.xml │ │ │ ├── resc_map.c │ │ │ ├── strToL.c │ │ │ ├── strTouL.c │ │ │ └── uLTostr.c │ │ ├── Libauth/ │ │ │ ├── Makefile.am │ │ │ ├── README.md │ │ │ ├── gss/ │ │ │ │ ├── Makefile.am │ │ │ │ └── pbs_gss.c │ │ │ └── munge/ │ │ │ ├── Makefile.am │ │ │ └── munge_supp.c │ │ ├── Libcmds/ │ │ │ ├── batch_status.c │ │ │ ├── check_job_script.c │ │ │ ├── chk_Jrange.c │ │ │ ├── ck_job_name.c │ │ │ ├── cmds_common.c │ │ │ ├── cnt2server.c │ │ │ ├── cs_error.c │ │ │ ├── cvtdate.c │ │ │ ├── err_handling.c │ │ │ ├── get_attr.c │ │ │ ├── get_dataservice_usr.c │ │ │ ├── get_server.c │ │ │ ├── isjobid.c │ │ │ ├── locate_job.c │ │ │ ├── parse_at.c │ │ │ ├── parse_depend.c │ │ │ ├── parse_destid.c │ │ │ ├── parse_equal.c │ │ │ ├── parse_jobid.c │ │ │ ├── parse_stage.c │ │ │ ├── prepare_path.c │ │ │ ├── set_attr.c │ │ │ └── set_resource.c │ │ ├── Libdb/ │ │ │ ├── Makefile.am │ │ │ └── pgsql/ │ │ │ ├── Makefile.am │ │ │ ├── db_attr.c │ │ │ ├── db_common.c │ │ │ ├── db_job.c │ │ │ ├── db_node.c 
│ │ │ ├── db_postgres.h │ │ │ ├── db_que.c │ │ │ ├── db_resv.c │ │ │ ├── db_sched.c │ │ │ ├── db_svr.c │ │ │ ├── pbs_db_env │ │ │ ├── pbs_db_schema.sql │ │ │ ├── pbs_db_utility │ │ │ ├── pbs_ds_systemd │ │ │ └── pbs_schema_upgrade │ │ ├── Libdis/ │ │ │ ├── dis.c │ │ │ ├── dis_.h │ │ │ ├── dis_helpers.c │ │ │ ├── discui_.c │ │ │ ├── discul_.c │ │ │ ├── discull_.c │ │ │ ├── disi10d_.c │ │ │ ├── disi10l_.c │ │ │ ├── disiui_.c │ │ │ ├── disp10d_.c │ │ │ ├── disp10l_.c │ │ │ ├── disrcs.c │ │ │ ├── disrd.c │ │ │ ├── disrf.c │ │ │ ├── disrfcs.c │ │ │ ├── disrfst.c │ │ │ ├── disrl.c │ │ │ ├── disrl_.c │ │ │ ├── disrsc.c │ │ │ ├── disrsi.c │ │ │ ├── disrsi_.c │ │ │ ├── disrsl.c │ │ │ ├── disrsl_.c │ │ │ ├── disrsll_.c │ │ │ ├── disrss.c │ │ │ ├── disrst.c │ │ │ ├── disruc.c │ │ │ ├── disrui.c │ │ │ ├── disrul.c │ │ │ ├── disrull.c │ │ │ ├── disrus.c │ │ │ ├── diswcs.c │ │ │ ├── diswf.c │ │ │ ├── diswl_.c │ │ │ ├── diswsi.c │ │ │ ├── diswsl.c │ │ │ ├── diswui.c │ │ │ ├── diswui_.c │ │ │ ├── diswul.c │ │ │ ├── diswull.c │ │ │ └── ps_dis.c │ │ ├── Libecl/ │ │ │ ├── ecl_verify.c │ │ │ ├── ecl_verify_datatypes.c │ │ │ ├── ecl_verify_object_name.c │ │ │ ├── ecl_verify_values.c │ │ │ └── pbs_client_thread.c │ │ ├── Libifl/ │ │ │ ├── DIS_decode.c │ │ │ ├── DIS_encode.c │ │ │ ├── Makefile.am │ │ │ ├── PBS_attr.c │ │ │ ├── advise.c │ │ │ ├── auth.c │ │ │ ├── conn_table.c │ │ │ ├── dec_DelJobList.c │ │ │ ├── dec_reply.c │ │ │ ├── enc_reply.c │ │ │ ├── entlim_parse.c │ │ │ ├── get_svrport.c │ │ │ ├── grunt_parse.c │ │ │ ├── ifl_impl.c │ │ │ ├── ifl_pointers.c │ │ │ ├── ifl_util.c │ │ │ ├── int_cred.c │ │ │ ├── int_hook.c │ │ │ ├── int_jcred.c │ │ │ ├── int_manage2.c │ │ │ ├── int_manager.c │ │ │ ├── int_modify_resv.c │ │ │ ├── int_msg2.c │ │ │ ├── int_rdrpy.c │ │ │ ├── int_sig2.c │ │ │ ├── int_status.c │ │ │ ├── int_status2.c │ │ │ ├── int_submit.c │ │ │ ├── int_submit_resv.c │ │ │ ├── int_ucred.c │ │ │ ├── list_link.c │ │ │ ├── pbsD_Preempt_Jobs.c │ │ │ ├── pbsD_alterjob.c │ │ │ ├── 
pbsD_confirmresv.c │ │ │ ├── pbsD_connect.c │ │ │ ├── pbsD_defschreply.c │ │ │ ├── pbsD_deljob.c │ │ │ ├── pbsD_deljoblist.c │ │ │ ├── pbsD_delresv.c │ │ │ ├── pbsD_holdjob.c │ │ │ ├── pbsD_locjob.c │ │ │ ├── pbsD_manager.c │ │ │ ├── pbsD_modify_resv.c │ │ │ ├── pbsD_movejob.c │ │ │ ├── pbsD_msgjob.c │ │ │ ├── pbsD_orderjo.c │ │ │ ├── pbsD_rerunjo.c │ │ │ ├── pbsD_resc.c │ │ │ ├── pbsD_rlsjob.c │ │ │ ├── pbsD_runjob.c │ │ │ ├── pbsD_selectj.c │ │ │ ├── pbsD_sigjob.c │ │ │ ├── pbsD_stagein.c │ │ │ ├── pbsD_stathook.c │ │ │ ├── pbsD_stathost.c │ │ │ ├── pbsD_statjob.c │ │ │ ├── pbsD_statnode.c │ │ │ ├── pbsD_statque.c │ │ │ ├── pbsD_statresv.c │ │ │ ├── pbsD_statrsc.c │ │ │ ├── pbsD_statsched.c │ │ │ ├── pbsD_statsrv.c │ │ │ ├── pbsD_submit.c │ │ │ ├── pbsD_submit_resv.c │ │ │ ├── pbsD_termin.c │ │ │ ├── pbs_delstatfree.c │ │ │ ├── pbs_get_attribute_errors.c │ │ │ ├── pbs_geterrmg.c │ │ │ ├── pbs_geterrno.c │ │ │ ├── pbs_ifl.i │ │ │ ├── pbs_loadconf.c │ │ │ ├── pbs_quote_parse.c │ │ │ ├── pbs_statfree.c │ │ │ ├── rm.c │ │ │ ├── strsep.c │ │ │ ├── tcp_dis.c │ │ │ ├── tm.c │ │ │ └── xml_encode_decode.c │ │ ├── Libjson/ │ │ │ ├── Makefile.am │ │ │ └── cJSON/ │ │ │ ├── Makefile.am │ │ │ └── pbs_cjson.c │ │ ├── Liblicensing/ │ │ │ ├── Makefile.am │ │ │ ├── liblicense.h │ │ │ └── license_client.c │ │ ├── Liblog/ │ │ │ ├── Makefile.am │ │ │ ├── chk_file_sec.c │ │ │ ├── log_event.c │ │ │ ├── pbs_log.c │ │ │ ├── pbs_messages.c │ │ │ └── setup_env.c │ │ ├── Libnet/ │ │ │ ├── Makefile.am │ │ │ ├── get_hostaddr.c │ │ │ ├── hnls.c │ │ │ ├── net_client.c │ │ │ ├── net_server.c │ │ │ ├── net_set_clse.c │ │ │ └── port_forwarding.c │ │ ├── Libpbs/ │ │ │ ├── Makefile.am │ │ │ └── pbs.pc.in │ │ ├── Libpython/ │ │ │ ├── Makefile.am │ │ │ ├── common_python_utils.c │ │ │ ├── module_pbs_v1.c │ │ │ ├── pbs_python_external.c │ │ │ ├── pbs_python_import_types.c │ │ │ ├── pbs_python_svr_external.c │ │ │ ├── pbs_python_svr_internal.c │ │ │ ├── pbs_python_svr_size_type.c │ │ │ └── 
shared_python_utils.c │ │ ├── Libsec/ │ │ │ ├── Makefile.am │ │ │ └── cs_standard.c │ │ ├── Libsite/ │ │ │ ├── Makefile.am │ │ │ ├── site_allow_u.c │ │ │ ├── site_alt_rte.c │ │ │ ├── site_check_u.c │ │ │ ├── site_map_usr.c │ │ │ ├── site_mom_chu.c │ │ │ ├── site_mom_ckp.c │ │ │ └── site_mom_jst.c │ │ ├── Libtpp/ │ │ │ ├── Makefile.am │ │ │ ├── tpp_client.c │ │ │ ├── tpp_em.c │ │ │ ├── tpp_internal.h │ │ │ ├── tpp_platform.c │ │ │ ├── tpp_router.c │ │ │ ├── tpp_transport.c │ │ │ └── tpp_util.c │ │ ├── Libutil/ │ │ │ ├── Makefile.am │ │ │ ├── avltree.c │ │ │ ├── daemon_protect.c │ │ │ ├── dedup_jobids.c │ │ │ ├── entlim.c │ │ │ ├── execvnode_seq_util.c │ │ │ ├── get_hostname.c │ │ │ ├── hook.c │ │ │ ├── misc_utils.c │ │ │ ├── pbs_aes_encrypt.c │ │ │ ├── pbs_array_list.c │ │ │ ├── pbs_ical.c │ │ │ ├── pbs_idx.c │ │ │ ├── pbs_secrets.c │ │ │ ├── range.c │ │ │ ├── thread_utils.c │ │ │ └── work_task.c │ │ └── Makefile.am │ ├── modules/ │ │ ├── Makefile.am │ │ └── python/ │ │ ├── Makefile.am │ │ ├── pbs/ │ │ │ ├── __init__.py │ │ │ └── v1/ │ │ │ ├── __init__.py │ │ │ ├── _attr_types.py │ │ │ ├── _base_types.py │ │ │ ├── _exc_types.py │ │ │ ├── _export_types.py │ │ │ ├── _pmi_cray.py │ │ │ ├── _pmi_none.py │ │ │ ├── _pmi_sgi.py │ │ │ ├── _pmi_types.py │ │ │ ├── _pmi_utils.py │ │ │ └── _svr_types.py │ │ ├── pbs_hooks/ │ │ │ ├── PBS_alps_inventory_check.HK │ │ │ ├── PBS_alps_inventory_check.PY │ │ │ ├── PBS_cray_atom.CF │ │ │ ├── PBS_cray_atom.HK │ │ │ ├── PBS_cray_atom.PY │ │ │ ├── PBS_power.CF │ │ │ ├── PBS_power.HK │ │ │ ├── PBS_power.PY │ │ │ ├── PBS_xeon_phi_provision.HK │ │ │ └── PBS_xeon_phi_provision.PY │ │ ├── pbs_v1_module_init.c │ │ ├── setup.cfg │ │ └── setup.py │ ├── mom_rcp/ │ │ ├── Makefile.am │ │ ├── README │ │ ├── extern.h │ │ ├── pathnames.h │ │ ├── pbs_stat.h │ │ ├── rcp.c │ │ ├── replace.c │ │ └── util.c │ ├── resmom/ │ │ ├── Makefile.am │ │ ├── catch_child.c │ │ ├── job_recov_fs.c │ │ ├── linux/ │ │ │ ├── alps.c │ │ │ ├── mom_func.c │ │ │ ├── mom_mach.c 
│ │ │ ├── mom_mach.h │ │ │ ├── mom_start.c │ │ │ └── pe_input.c │ │ ├── mock_run.c │ │ ├── mock_run.h │ │ ├── mom_comm.c │ │ ├── mom_hook_func.c │ │ ├── mom_inter.c │ │ ├── mom_main.c │ │ ├── mom_pmix.c │ │ ├── mom_pmix.h │ │ ├── mom_server.c │ │ ├── mom_updates_bundle.c │ │ ├── mom_vnode.c │ │ ├── mom_walltime.c │ │ ├── popen.c │ │ ├── prolog.c │ │ ├── renew_creds.c │ │ ├── renew_creds.h │ │ ├── requests.c │ │ ├── rm_dep.h │ │ ├── stage_func.c │ │ ├── start_exec.c │ │ └── vnode_storage.c │ ├── scheduler/ │ │ ├── Makefile.am │ │ ├── buckets.cpp │ │ ├── buckets.h │ │ ├── check.cpp │ │ ├── check.h │ │ ├── config.h │ │ ├── constant.h │ │ ├── data_types.h │ │ ├── dedtime.cpp │ │ ├── dedtime.h │ │ ├── fairshare.cpp │ │ ├── fairshare.h │ │ ├── fifo.cpp │ │ ├── fifo.h │ │ ├── get_4byte.cpp │ │ ├── globals.cpp │ │ ├── globals.h │ │ ├── job_info.cpp │ │ ├── job_info.h │ │ ├── limits.cpp │ │ ├── limits_if.h │ │ ├── list_order.awk │ │ ├── misc.cpp │ │ ├── misc.h │ │ ├── multi_threading.cpp │ │ ├── multi_threading.h │ │ ├── node_info.cpp │ │ ├── node_info.h │ │ ├── node_partition.cpp │ │ ├── node_partition.h │ │ ├── parse.cpp │ │ ├── parse.h │ │ ├── pbs_bitmap.cpp │ │ ├── pbs_bitmap.h │ │ ├── pbs_dedicated │ │ ├── pbs_holidays │ │ ├── pbs_holidays.2017 │ │ ├── pbs_resource_group │ │ ├── pbs_sched.cpp │ │ ├── pbs_sched_bare.cpp │ │ ├── pbs_sched_config │ │ ├── pbs_sched_utils.cpp │ │ ├── pbsfs.cpp │ │ ├── prev_job_info.cpp │ │ ├── prev_job_info.h │ │ ├── prime.cpp │ │ ├── prime.h │ │ ├── queue.cpp │ │ ├── queue.h │ │ ├── queue_info.cpp │ │ ├── queue_info.h │ │ ├── resource.cpp │ │ ├── resource.h │ │ ├── resource_resv.cpp │ │ ├── resource_resv.h │ │ ├── resv_info.cpp │ │ ├── resv_info.h │ │ ├── sched_exception.cpp │ │ ├── sched_ifl_wrappers.cpp │ │ ├── server_info.cpp │ │ ├── server_info.h │ │ ├── simulate.cpp │ │ ├── simulate.h │ │ ├── site_code.cpp │ │ ├── site_code.h │ │ ├── site_data.h │ │ ├── sort.cpp │ │ ├── sort.h │ │ ├── state_count.cpp │ │ └── state_count.h │ ├── 
server/ │ │ ├── Makefile.am │ │ ├── accounting.c │ │ ├── array_func.c │ │ ├── attr_recov.c │ │ ├── attr_recov_db.c │ │ ├── checkkey.c │ │ ├── daemon_info.c │ │ ├── dis_read.c │ │ ├── failover.c │ │ ├── geteusernam.c │ │ ├── hook_func.c │ │ ├── issue_request.c │ │ ├── jattr_get_set.c │ │ ├── job_func.c │ │ ├── job_recov_db.c │ │ ├── job_route.c │ │ ├── license_client.c │ │ ├── licensing_func.c │ │ ├── mom_info.c │ │ ├── nattr_get_set.c │ │ ├── node_func.c │ │ ├── node_manager.c │ │ ├── node_recov_db.c │ │ ├── pbs_comm.c │ │ ├── pbs_db_func.c │ │ ├── pbsd_init.c │ │ ├── pbsd_main.c │ │ ├── process_request.c │ │ ├── qattr_get_set.c │ │ ├── queue_func.c │ │ ├── queue_recov_db.c │ │ ├── rattr_get_set.c │ │ ├── reply_send.c │ │ ├── req_cred.c │ │ ├── req_delete.c │ │ ├── req_getcred.c │ │ ├── req_holdjob.c │ │ ├── req_jobobit.c │ │ ├── req_locate.c │ │ ├── req_manager.c │ │ ├── req_message.c │ │ ├── req_modify.c │ │ ├── req_movejob.c │ │ ├── req_preemptjob.c │ │ ├── req_quejob.c │ │ ├── req_register.c │ │ ├── req_rerun.c │ │ ├── req_rescq.c │ │ ├── req_runjob.c │ │ ├── req_select.c │ │ ├── req_shutdown.c │ │ ├── req_signal.c │ │ ├── req_stat.c │ │ ├── req_track.c │ │ ├── resc_attr.c │ │ ├── run_sched.c │ │ ├── sattr_get_set.c │ │ ├── sched_attr_get_set.c │ │ ├── sched_func.c │ │ ├── setup_resc.c │ │ ├── stat_job.c │ │ ├── svr_chk_owner.c │ │ ├── svr_connect.c │ │ ├── svr_credfunc.c │ │ ├── svr_func.c │ │ ├── svr_jobfunc.c │ │ ├── svr_mail.c │ │ ├── svr_movejob.c │ │ ├── svr_recov_db.c │ │ ├── svr_resccost.c │ │ ├── user_func.c │ │ └── vnparse.c │ ├── tools/ │ │ ├── Makefile.am │ │ ├── chk_tree.c │ │ ├── create_env_file.sh │ │ ├── hostn.c │ │ ├── pbsTclInit.c │ │ ├── pbsTkInit.c │ │ ├── pbs_ds_monitor.c │ │ ├── pbs_idled.c │ │ ├── pbs_probe.c │ │ ├── pbs_python.c │ │ ├── pbs_sleep.c │ │ ├── pbs_tclWrap.c │ │ ├── pbs_upgrade_job.c │ │ ├── printjob.c │ │ ├── rstester.c │ │ ├── site_tclWrap.c │ │ ├── tracejob.c │ │ ├── tracejob.h │ │ └── wrap_tcl.sh.in │ └── unsupported/ │ 
├── Makefile.am │ ├── NodeHealthCheck.json │ ├── NodeHealthCheck.py │ ├── README │ ├── ReliableJobStartup.py │ ├── cray_readme │ ├── load_balance.py │ ├── mom_dyn_res.py │ ├── pbs-mailer/ │ │ ├── README.md │ │ ├── debian/ │ │ │ ├── changelog │ │ │ ├── compat │ │ │ ├── conffiles │ │ │ ├── control │ │ │ ├── pbs-mailer.service │ │ │ └── rules │ │ ├── pbs_mail.json │ │ ├── pbs_mail_saver │ │ ├── pbs_mail_sender │ │ ├── release-deb.sh │ │ └── release-rpm.sh │ ├── pbs_config │ ├── pbs_jobs_at.8B │ ├── pbs_loganalyzer │ ├── pbs_output.py │ ├── pbs_rescquery.3B │ ├── pbs_rmget.8B │ ├── pbs_rmget.c │ ├── pbs_stat │ ├── rapid_inter.py │ ├── renew-test/ │ │ ├── base64.c │ │ ├── base64.h │ │ └── renew-test.c │ ├── run_pelog_shell.ini │ ├── run_pelog_shell.py │ ├── sgiICEplacement.sh │ ├── sgiICEvnode.sh │ └── sgigenvnodelist.awk ├── test/ │ ├── Makefile.am │ ├── fw/ │ │ ├── MANIFEST.in │ │ ├── Makefile.am │ │ ├── bin/ │ │ │ ├── pbs_as │ │ │ ├── pbs_benchpress │ │ │ ├── pbs_compare_results │ │ │ ├── pbs_config │ │ │ ├── pbs_cov │ │ │ ├── pbs_loganalyzer │ │ │ ├── pbs_py_spawn │ │ │ ├── pbs_snapshot │ │ │ ├── pbs_stat │ │ │ ├── pbs_swigify │ │ │ └── pbs_sys_report │ │ ├── doc/ │ │ │ ├── caveats.rst │ │ │ ├── commands.rst │ │ │ ├── conf.py │ │ │ ├── howtotest.rst │ │ │ ├── index.rst │ │ │ ├── install.rst │ │ │ ├── intro.rst │ │ │ ├── make.bat │ │ │ ├── ptl.rst │ │ │ └── tutorial.rst │ │ ├── ptl/ │ │ │ ├── __init__.py.in │ │ │ ├── lib/ │ │ │ │ ├── __init__.py │ │ │ │ ├── pbs_api_to_cli.py │ │ │ │ ├── pbs_ifl_mock.py │ │ │ │ ├── pbs_testlib.py │ │ │ │ ├── ptl_batchutils.py │ │ │ │ ├── ptl_comm.py │ │ │ │ ├── ptl_config.py │ │ │ │ ├── ptl_constants.py │ │ │ │ ├── ptl_entities.py │ │ │ │ ├── ptl_error.py │ │ │ │ ├── ptl_expect_action.py │ │ │ │ ├── ptl_fairshare.py │ │ │ │ ├── ptl_mom.py │ │ │ │ ├── ptl_object.py │ │ │ │ ├── ptl_resourceresv.py │ │ │ │ ├── ptl_sched.py │ │ │ │ ├── ptl_server.py │ │ │ │ ├── ptl_service.py │ │ │ │ ├── ptl_types.py │ │ │ │ └── ptl_wrappers.py │ │ │ └── 
utils/ │ │ │ ├── __init__.py │ │ │ ├── pbs_anonutils.py │ │ │ ├── pbs_cliutils.py │ │ │ ├── pbs_covutils.py │ │ │ ├── pbs_crayutils.py │ │ │ ├── pbs_dshutils.py │ │ │ ├── pbs_logutils.py │ │ │ ├── pbs_procutils.py │ │ │ ├── pbs_snaputils.py │ │ │ ├── pbs_testsuite.py │ │ │ ├── pbs_testusers.py │ │ │ └── plugins/ │ │ │ ├── __init__.py │ │ │ ├── ptl_report_json.py │ │ │ ├── ptl_test_data.py │ │ │ ├── ptl_test_db.py │ │ │ ├── ptl_test_info.py │ │ │ ├── ptl_test_loader.py │ │ │ ├── ptl_test_runner.py │ │ │ └── ptl_test_tags.py │ │ ├── ptl.csh │ │ ├── ptl.sh │ │ ├── ptlreport │ │ ├── requirements.txt │ │ └── setup.py.in │ ├── scripts/ │ │ └── qsub_multi.sh │ └── tests/ │ ├── Makefile.am │ ├── __init__.py │ ├── functional/ │ │ ├── __init__.py │ │ ├── pbs_Rrecord_resources_used.py │ │ ├── pbs_acct_log.py │ │ ├── pbs_accumulate_resc_used.py │ │ ├── pbs_acl_groups.py │ │ ├── pbs_acl_host_moms.py │ │ ├── pbs_acl_host_queue.py │ │ ├── pbs_acl_host_server.py │ │ ├── pbs_admin_suspend.py │ │ ├── pbs_allpart.py │ │ ├── pbs_alps_inventory_check_hook.py │ │ ├── pbs_alps_release_tunables.py │ │ ├── pbs_array_job_mail.py │ │ ├── pbs_basil_parser_err.py │ │ ├── pbs_basil_support.py │ │ ├── pbs_calendaring.py │ │ ├── pbs_cgroups_hook.py │ │ ├── pbs_check_job_attrib.py │ │ ├── pbs_checkpoint.py │ │ ├── pbs_client_response.py │ │ ├── pbs_complete_running_parent_job.py │ │ ├── pbs_conf_resv_stale_vnode.py │ │ ├── pbs_config.py │ │ ├── pbs_cpuset.py │ │ ├── pbs_cray_check_node_exclusivity.py │ │ ├── pbs_cray_hyperthread.py │ │ ├── pbs_cray_pagg_id.py │ │ ├── pbs_cray_reliable_job_startup.py │ │ ├── pbs_cray_smoketest.py │ │ ├── pbs_cray_suspend_resume.py │ │ ├── pbs_cray_vnode_per_numa.py │ │ ├── pbs_cray_vnode_pool.py │ │ ├── pbs_daemon_service_user.py │ │ ├── pbs_dup_acc_log_for_resv.py │ │ ├── pbs_eligible_time.py │ │ ├── pbs_equiv_classes.py │ │ ├── pbs_exceeded_resources_notification.py │ │ ├── pbs_execjob_susp_resume.py │ │ ├── pbs_fairshare.py │ │ ├── 
pbs_gen_nodefile_on_sister_mom.py │ │ ├── pbs_grunt.py │ │ ├── pbs_highreslog.py │ │ ├── pbs_holidays.py │ │ ├── pbs_hook_config_os_env.py │ │ ├── pbs_hook_crosslink_mom.py │ │ ├── pbs_hook_debug_input.py │ │ ├── pbs_hook_debug_nocrash.py │ │ ├── pbs_hook_exechost_periodic.py │ │ ├── pbs_hook_execjob_abort.py │ │ ├── pbs_hook_execjob_end.py │ │ ├── pbs_hook_execjob_prologue.py │ │ ├── pbs_hook_jobobit.py │ │ ├── pbs_hook_management.py │ │ ├── pbs_hook_modifyvnode_state_changes.py │ │ ├── pbs_hook_perf_stat.py │ │ ├── pbs_hook_postqueuejob.py │ │ ├── pbs_hook_set_attr.py │ │ ├── pbs_hook_set_interrupt.py │ │ ├── pbs_hook_set_jobenv.py │ │ ├── pbs_hook_set_nonexist.py │ │ ├── pbs_hook_timeout.py │ │ ├── pbs_hook_unset_res.py │ │ ├── pbs_hooksmoketest.py │ │ ├── pbs_hookswig.py │ │ ├── pbs_indirect_resources.py │ │ ├── pbs_init_script.py │ │ ├── pbs_job_array.py │ │ ├── pbs_job_array_comment.py │ │ ├── pbs_job_comment_on_resume.py │ │ ├── pbs_job_default_group.py │ │ ├── pbs_job_dependency.py │ │ ├── pbs_job_purge.py │ │ ├── pbs_job_requeue_timeout_error.py │ │ ├── pbs_job_routing.py │ │ ├── pbs_job_script.py │ │ ├── pbs_job_sort_formula.py │ │ ├── pbs_job_status_after_mom_hup.py │ │ ├── pbs_job_task.py │ │ ├── pbs_maintenance_reservations.py │ │ ├── pbs_modifyresv_hook.py │ │ ├── pbs_mom_hook_sync.py │ │ ├── pbs_mom_hooks_test.py │ │ ├── pbs_mom_job_dir.py │ │ ├── pbs_mom_local_nodename.py │ │ ├── pbs_mom_mock_run.py │ │ ├── pbs_mom_walltime.py │ │ ├── pbs_moved_job.py │ │ ├── pbs_moved_job_local.py │ │ ├── pbs_multi_sched.py │ │ ├── pbs_multiple_execjob_launch_hook.py │ │ ├── pbs_node_buckets.py │ │ ├── pbs_node_jobs_restart.py │ │ ├── pbs_node_jobs_restart_multinode.py │ │ ├── pbs_node_rampdown.py │ │ ├── pbs_node_rampdown_keep_select.py │ │ ├── pbs_node_sleep_state.py │ │ ├── pbs_nodes_json.py │ │ ├── pbs_nodes_queues.py │ │ ├── pbs_nonprint_characters.py │ │ ├── pbs_offline_vnodes.py │ │ ├── pbs_one_event_multiple_hooks.py │ │ ├── pbs_only_explicit_psets.py │ │ 
├── pbs_only_small_files_over_tpp.py │ │ ├── pbs_passing_environment_variable.py │ │ ├── pbs_pbsnodes.py │ │ ├── pbs_pbsnodes_output_trimmed.py │ │ ├── pbs_peer.py │ │ ├── pbs_periodic_constant.py │ │ ├── pbs_power_provisioning_cray.py │ │ ├── pbs_power_provisioning_sgi.py │ │ ├── pbs_preemption.py │ │ ├── pbs_printjob.py │ │ ├── pbs_provisioning.py │ │ ├── pbs_provisioning_enhancement.py │ │ ├── pbs_python_restart_settings.py │ │ ├── pbs_python_test.py │ │ ├── pbs_qdel.py │ │ ├── pbs_qmgr.py │ │ ├── pbs_qrun.py │ │ ├── pbs_qselect.py │ │ ├── pbs_qstat.py │ │ ├── pbs_qstat_2servers.py │ │ ├── pbs_qstat_count.py │ │ ├── pbs_qstat_formats.py │ │ ├── pbs_qsub_direct_write.py │ │ ├── pbs_qsub_opts_args.py │ │ ├── pbs_qsub_remove_files.py │ │ ├── pbs_qsub_script.py │ │ ├── pbs_qsub_wblock.py │ │ ├── pbs_que_resc_usage.py │ │ ├── pbs_ralter.py │ │ ├── pbs_release_limited_res_suspend.py │ │ ├── pbs_reliable_job_startup.py │ │ ├── pbs_resc_custom_perm.py │ │ ├── pbs_resc_used_single_node.py │ │ ├── pbs_reservations.py │ │ ├── pbs_resource_multichunk.py │ │ ├── pbs_resource_unset.py │ │ ├── pbs_resource_usage_log.py │ │ ├── pbs_resv_begin_hook.py │ │ ├── pbs_resv_confirm_hook.py │ │ ├── pbs_resv_end_hook.py │ │ ├── pbs_resv_start_dur_end.py │ │ ├── pbs_root_owned_script.py │ │ ├── pbs_rstat.py │ │ ├── pbs_runjob_hook.py │ │ ├── pbs_sched_attr_updates.py │ │ ├── pbs_sched_badstate.py │ │ ├── pbs_sched_fifo.py │ │ ├── pbs_sched_preempt_enforce_resumption.py │ │ ├── pbs_sched_rerun.py │ │ ├── pbs_sched_runjobwait.py │ │ ├── pbs_sched_signal.py │ │ ├── pbs_schedule_indirect_resources.py │ │ ├── pbs_server_hook_attr.py │ │ ├── pbs_server_periodic_hook.py │ │ ├── pbs_set_enforcement.py │ │ ├── pbs_sister_mom_crash.py │ │ ├── pbs_snapshot_unittest.py │ │ ├── pbs_soft_walltime.py │ │ ├── pbs_stf.py │ │ ├── pbs_strict_ordering.py │ │ ├── pbs_support_linux_hook_event_phase1_2.py │ │ ├── pbs_suspend_resume_accounting.py │ │ ├── pbs_svr_dyn_res.py │ │ ├── pbs_systemd.py │ │ ├── 
pbs_test_entity_limits.py │ │ ├── pbs_test_qorder.py │ │ ├── pbs_test_run_count.py │ │ ├── pbs_test_svr_dflt.py │ │ ├── pbs_test_tpp.py │ │ ├── pbs_trillion_jobid.py │ │ ├── pbs_two_mom_hooks_resources_used.py │ │ ├── pbs_types.py │ │ ├── pbs_unknown_resource_hook_update.py │ │ ├── pbs_unset_exectime.py │ │ ├── pbs_user_reliability.py │ │ ├── pbs_validate_job_qsub_attributes.py │ │ └── pbs_verify_log_output.py │ ├── interfaces/ │ │ ├── __init__.py │ │ ├── pbs_libpbs_so.py │ │ ├── pbs_node_partition.py │ │ ├── pbs_partition.py │ │ ├── pbs_preempt_params.py │ │ └── pbs_sched_interface_test.py │ ├── pbs_smoketest.py │ ├── performance/ │ │ ├── __init__.py │ │ ├── pbs_cgroups_stress.py │ │ ├── pbs_client_nagle_performance.py │ │ ├── pbs_equiv_classes_perf.py │ │ ├── pbs_history_cleanup_quasihang.py │ │ ├── pbs_jobperf.py │ │ ├── pbs_preemptperformance.py │ │ ├── pbs_qstat_performance.py │ │ ├── pbs_qsub_performance.py │ │ ├── pbs_rerunjob_file_transfer_perf.py │ │ ├── pbs_runjobwait_perf.py │ │ ├── pbs_sched_perf.py │ │ ├── pbs_standing_resv_quasihang.py │ │ └── test_dependency_perf.py │ ├── resilience/ │ │ ├── __init__.py │ │ └── pbs_hook_alarm_large_multinode_job.py │ ├── security/ │ │ ├── __init__.py │ │ ├── pbs_command_injection.py │ │ └── pbs_multiple_auth.py │ ├── selftest/ │ │ ├── __init__.py │ │ ├── pbs_config_sched.py │ │ ├── pbs_cycles_test.py │ │ ├── pbs_default_timeout.py │ │ ├── pbs_dshutils_tests.py │ │ ├── pbs_expect.py │ │ ├── pbs_initservices.py │ │ ├── pbs_job_cleanup.py │ │ ├── pbs_json_test_report.py │ │ ├── pbs_manager.py │ │ ├── pbs_managers_operators.py │ │ ├── pbs_param_dict.py │ │ ├── pbs_pbstestsuite.py │ │ ├── pbs_requirements_decorator.py │ │ ├── pbs_resvid_test.py │ │ ├── pbs_test_create_vnodes.py │ │ ├── pbs_test_revert_site_hooks.py │ │ ├── pbs_test_revert_to_defaults.py │ │ ├── pbs_testlogutils.py │ │ └── pbs_testparams_decorator.py │ └── upgrades/ │ └── __init__.py └── valgrind.supp ================================================ FILE 
CONTENTS ================================================ ================================================ FILE: .clang-format ================================================ --- Language: Cpp # BasedOnStyle: LLVM AccessModifierOffset: -2 AlignAfterOpenBracket: Align AlignConsecutiveAssignments: false AlignConsecutiveDeclarations: false AlignEscapedNewlines: Right AlignOperands: true AlignTrailingComments: true AllowAllArgumentsOnNextLine: true AllowAllConstructorInitializersOnNextLine: true AllowAllParametersOfDeclarationOnNextLine: true AllowShortBlocksOnASingleLine: false AllowShortCaseLabelsOnASingleLine: false AllowShortFunctionsOnASingleLine: All AllowShortLambdasOnASingleLine: All AllowShortIfStatementsOnASingleLine: Never AllowShortLoopsOnASingleLine: false AlwaysBreakAfterDefinitionReturnType: None AlwaysBreakBeforeMultilineStrings: false AlwaysBreakTemplateDeclarations: MultiLine BinPackArguments: true BinPackParameters: true BreakBeforeBraces: Custom BraceWrapping: AfterCaseLabel: false AfterClass: false AfterControlStatement: false AfterEnum: false AfterFunction: true AfterNamespace: false AfterObjCDeclaration: false AfterStruct: false AfterUnion: false AfterExternBlock: false BeforeCatch: false BeforeElse: false IndentBraces: false SplitEmptyFunction: true SplitEmptyRecord: true SplitEmptyNamespace: true BreakBeforeBinaryOperators: None BreakBeforeInheritanceComma: false BreakInheritanceList: BeforeColon BreakBeforeTernaryOperators: true BreakConstructorInitializersBeforeComma: false BreakConstructorInitializers: BeforeColon BreakAfterJavaFieldAnnotations: false BreakStringLiterals: true ColumnLimit: 0 CommentPragmas: '^ IWYU pragma:' CompactNamespaces: false ConstructorInitializerAllOnOneLineOrOnePerLine: false ConstructorInitializerIndentWidth: 4 ContinuationIndentWidth: 8 Cpp11BracedListStyle: true DerivePointerAlignment: false DisableFormat: false ExperimentalAutoDetectBinPacking: false FixNamespaceComments: true ForEachMacros: - foreach - 
Q_FOREACH - BOOST_FOREACH IncludeBlocks: Preserve IncludeCategories: - Regex: '[<"]pbs_config.h[>"]' Priority: -1 - Regex: '.*' Priority: 3 - Regex: '^"(llvm|llvm-c|clang|clang-c)/' Priority: 2 - Regex: '^(<|"(gtest|gmock|isl|json)/)' Priority: 4 IncludeIsMainRegex: '(Test)?$' IndentCaseLabels: true IndentPPDirectives: None IndentWidth: 8 IndentWrappedFunctionNames: false JavaScriptQuotes: Leave JavaScriptWrapImports: true KeepEmptyLinesAtTheStartOfBlocks: true MacroBlockBegin: '' MacroBlockEnd: '' MaxEmptyLinesToKeep: 1 NamespaceIndentation: None ObjCBinPackProtocolList: Auto ObjCBlockIndentWidth: 2 ObjCSpaceAfterProperty: false ObjCSpaceBeforeProtocolList: true PenaltyBreakAssignment: 2 PenaltyBreakBeforeFirstCallParameter: 19 PenaltyBreakComment: 300 PenaltyBreakFirstLessLess: 120 PenaltyBreakString: 1000 PenaltyBreakTemplateDeclaration: 10 PenaltyExcessCharacter: 1000000 PenaltyReturnTypeOnItsOwnLine: 60 PointerAlignment: Right ReflowComments: false SortIncludes: false SortUsingDeclarations: true SpaceAfterLogicalNot: false SpaceAfterTemplateKeyword: true SpaceBeforeAssignmentOperators: true SpaceBeforeCpp11BracedList: false SpaceBeforeCtorInitializerColon: true SpaceBeforeInheritanceColon: true SpaceBeforeParens: ControlStatements SpaceBeforeRangeBasedForLoopColon: true SpaceInEmptyParentheses: false SpacesBeforeTrailingComments: 1 SpacesInAngles: false SpacesInContainerLiterals: true SpacesInCStyleCastParentheses: false SpacesInParentheses: false SpacesInSquareBrackets: false Standard: Cpp11 StatementMacros: - Q_UNUSED - QT_REQUIRE_VERSION TabWidth: 8 UseTab: Always AlwaysBreakAfterReturnType: AllDefinitions SpaceAfterCStyleCast: true ... 
================================================ FILE: .github/PULL_REQUEST_TEMPLATE.md ================================================ #### Describe Bug or Feature #### Describe Your Change #### Link to Design Doc #### Attach Test and Valgrind Logs/Output ================================================ FILE: .github/checkclang ================================================ #!/bin/bash # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. 
# # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. export PATH=$PATH:/usr/local/bin/ checkdir="$(readlink -f $(dirname $0))" which clang-format 1>/dev/null 2>/dev/null if [ $? -ne 0 ]; then echo "Could not find clang-format command" 1>&2 exit 1 fi cd ${checkdir}/.. find . -iname *.h -o -iname *.c -o -iname *.cpp | xargs clang-format --dry-run exit $? ================================================ FILE: .github/checkpep8 ================================================ #!/bin/bash # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. checkdir="$(readlink -f $(dirname $0))" errors=0 which pep8 1>/dev/null 2>/dev/null if [ $? -ne 0 ]; then echo "Could not find pep8 command" 1>&2 exit 1 fi cd ${checkdir}/.. is_python_file() { name=$(basename ${1}) # special case # if .rst file then it will be considered # as a plain text file if [ "x${name##*.}" == "xrst" ]; then return 1 fi # special case # if __init__.py does not contain any code then file # command will consider it as plain text file if [ "x${name}" == "x__init__.py" ]; then return 0 fi if [ "x$(file --mime-type -b ${1})" == "xtext/x-python" ]; then return 0 fi return 1 } check_pep8() { pep8 --show-source ${1} >out_check_pep8 2>&1 return $? } for f in $(find test -type f) do if is_python_file ${f} then if ! check_pep8 ${f} then cat out_check_pep8 1>&2 rm -f out_check_pep8 errors=$((errors + 1)) fi if [ -x "${f}" ]; then echo "${f}: executable bit set" 1>&2 errors=$((errors + 1)) fi fi done if [ ${errors} -ne 0 ]; then exit 1 else exit 0 fi ================================================ FILE: .github/runchecks ================================================ #!/bin/bash # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. declare -a listofchecks listofchecks[0]="checkpep8" listofchecks[1]="checkclang" checkdir=$(readlink -f $(dirname $0)) errors_fails=0 for check in ${listofchecks[@]} do echo -n "Running check: '${check}' ... " if [ ! -x "${checkdir}/${check}" ]; then echo "NOTFOUND" errors_fails=$((errors_fails + 1)) continue fi ${checkdir}/${check} >out 2>err if [ $? 
-ne 0 ]; then echo "FAILED" cat err errors_fails=$((errors_fails + 1)) else echo "OK" cat out fi done if [ ${errors_fails} -ne 0 ]; then exit 1 else exit 0 fi ================================================ FILE: .gitignore ================================================ # Object files *.o *.ko *.obj *.elf *.slo # Precompiled Headers *.gch *.pch # Libraries *.lib *.libs *.a *.la *.lo *.lai # module files *.mod # Shared objects (inc. Windows DLLs) *.dll *.so *.so.* *.dylib # Executables *.exe *.out *.app *.i*86 *.x86_64 *.hex # Debug files *.dSYM/ # Eclipse project files .project .cproject .pydevproject .settings/ .autotools .csettings/ .devcontainer/ # Files used by ctags tags # Files used by cscope cscope.files cscope.out #Visual Studio files *.user *.ncb *.suo .vscode/ win_configure/.vs/ # Files used by gtags GPATH GRTAGS GTAGS # Files/Directory generated by PBSTestLab ptl_test_results.html ptl_test_results.json test/fw/build/ test/fw/ptl/__init__.py test/fw/setup.py test/tests/ptl_test_results.json test/tests/*/ptl_test_results.json # Byte-compiled / optimized / DLL files __pycache__/ *.py[cod] *$py.class # Python Distribution / packaging .Python develop-eggs/ dist/ downloads/ eggs/ .eggs/ sdist/ *.egg-info/ .installed.cfg *.egg # pip Installer logs pip-log.txt pip-delete-this-directory.txt *.log # Build directory target/ target-*/ #PyCharm project directory .idea/ # From automake/autoconf autom4te.cache/ autoscan.log autoscan-*.log configure.scan config.status aclocal.m4 buildutils/config.guess buildutils/config.sub # Libtool libtool m4/libtool.m4 m4/ltoptions.m4 m4/ltsugar.m4 m4/ltversion.m4 m4/lt~obsolete.m4 buildutils/ltmain.sh # Build related files configure Makefile.in Makefile *.deps buildutils/pbs_mkdirs buildutils/ar-lib buildutils/compile buildutils/depcomp buildutils/install-sh buildutils/missing buildutils/py-compile buildutils/exclude_script buildutils/makedepend-sh buildutils/ylwrap # Generated binaries src/cmds/mpiexec src/cmds/nqs2pbs 
src/cmds/pbs_attach src/cmds/pbs_demux src/cmds/pbs_ds_password.bin src/cmds/pbs_lamboot src/cmds/pbs_mpihp src/cmds/pbs_mpilam src/cmds/pbs_mpirun src/cmds/pbs_rdel src/cmds/pbs_remsh src/cmds/pbs_rstat src/cmds/pbs_rsub src/cmds/pbs_ralter src/cmds/pbs_tmrsh src/cmds/pbsdsh src/cmds/pbsnodes src/cmds/pbs_release_nodes src/cmds/pbs_dataservice.bin src/cmds/pbsrun src/cmds/pbsrun_unwrap src/cmds/pbsrun_wrap src/cmds/qalter src/cmds/qdel src/cmds/qdisable src/cmds/qenable src/cmds/qhold src/cmds/qmgr src/cmds/qmove src/cmds/qmsg src/cmds/qorder src/cmds/qrerun src/cmds/qrls src/cmds/qrun src/cmds/qselect src/cmds/qsig src/cmds/qstart src/cmds/qstat src/cmds/qstop src/cmds/qsub src/cmds/qterm src/cmds/scripts/limits.pbs_mom src/cmds/scripts/limits.post_services src/cmds/scripts/pbs_habitat src/cmds/scripts/pbs_init.d src/cmds/scripts/pbs_poerun src/cmds/scripts/pbs_postinstall src/cmds/scripts/pbsrun.poe src/cmds/scripts/pbs_reload src/iff/pbs_iff src/mom_rcp/pbs_rcp src/resmom/pbs_mom src/scheduler/pbs_sched src/scheduler/pbs_sched_bare src/scheduler/pbsfs src/server/pbs_comm src/server/pbs_server.bin src/tools/pbs_ds_monitor src/tools/pbs_hostn src/tools/pbs_idled src/tools/pbs_probe src/tools/pbs_python src/tools/pbs_tclsh src/tools/pbs_upgrade_job src/tools/pbs_wish src/tools/printjob.bin src/tools/printjob_svr.bin src/tools/tracejob src/tools/wrap_tcl.sh src/tools/pbs_sleep src/unsupported/pbs_rmget src/unsupported/renew-test/renew-test # Generated source files src/include/pbs_version.h src/include/pbs_config.h src/include/pbs_config.h.in src/include/pbs_config.h.in~ src/include/job_attr_enum.h src/include/node_attr_enum.h src/include/queue_attr_enum.h src/include/resc_def_enum.h src/include/resv_attr_enum.h src/include/sched_attr_enum.h src/include/svr_attr_enum.h src/lib/Libattr/queue_attr_def.c src/lib/Libattr/resc_def_all.c src/lib/Libattr/resv_attr_def.c src/lib/Libattr/sched_attr_def.c src/lib/Libattr/svr_attr_def.c src/lib/Libattr/job_attr_def.c 
src/lib/Libattr/node_attr_def.c src/lib/Libpbs/ecl_job_attr_def.c src/lib/Libpbs/ecl_node_attr_def.c src/lib/Libpbs/ecl_queue_attr_def.c src/lib/Libpbs/ecl_resc_def_all.c src/lib/Libpbs/ecl_resv_attr_def.c src/lib/Libpbs/ecl_sched_attr_def.c src/lib/Libpbs/ecl_svr_attr_def.c src/include/stamp-h1 src/lib/Libpython/pbs_ifl.i src/lib/Libpython/pbs_ifl.py src/lib/Libpython/pbs_ifl_wrap.c src/lib/Libifl/pbs_ifl.py src/lib/Libifl/pbs_ifl_wrap.c src/include/job_attr_enum.h src/include/node_attr_enum.h src/include/queue_attr_enum.h src/include/resc_def_enum.h src/include/resv_attr_enum.h src/include/sched_attr_enum.h src/include/svr_attr_enum.h #Generated source files - Windows src/lib/Libecl/ecl_node_attr_def.c src/lib/Libecl/ecl_job_attr_def.c src/lib/Libecl/ecl_queue_attr_def.c src/lib/Libecl/ecl_resc_def_all.c src/lib/Libecl/ecl_resv_attr_def.c src/lib/Libecl/ecl_sched_attr_def.c src/lib/Libecl/ecl_svr_attr_def.c win_configure/projects/pbs_ifl.i win_configure/projects/pbs_ifl.py win_configure/projects/pbs_ifl_wrap.c #ci logs ci/logs/ ci/logs/prev_LOGS/ ci/.* ci/packages ci/ptl_ts_tree.json ci/docker-compose.json # Generated scripts src/cmds/scripts/modulefile src/cmds/scripts/pbs.service # Generated by make dist *.tar.gz src/lib/Libpbs/pbs.pc # rpm spec file *.spec # Other archive file types *.tar *.tar.bz *.tgz *.zip *.cpio *.rpm *.deb # Generated directories by autotools *.libs ================================================ FILE: CODE_OF_CONDUCT.md ================================================ #### OpenPBS Open Source Project ## **Code of Conduct** This code of conduct is a guide for members of the OpenPBS community. We are committed to providing an open and welcoming environment for the OpenPBS community. We expect that all members of the community will behave according to this code of conduct. This code of conduct is intended to explain the spirit in which we expect to communicate, not to be an exhaustive list. 
This code of conduct applies to all elements of the OpenPBS community: mailing lists, bug tracking systems, etc. Anyone who violates this code of conduct may be banned from the OpenPBS community. It is unacceptable to follow the letter but not the spirit of this code of conduct. Guidelines for code of conduct: * **Be friendly and patient.** * **Be welcoming:** We strive to be a community that welcomes and supports people of all backgrounds and identities. * **Be considerate:** Your work will be used by other people, and you in turn will depend on the work of others. Decisions you make affect everyone in the community, so please be mindful of your actions and always choose a non-confrontational approach. Remember: this is a global community and English is not everyone's primary language. * **Be respectful:** Disagreements may occur, but we cannot abide personal attacks. The health of the community depends on all members feeling comfortable and supported. If you don't agree, use discretion and be polite. * **Be careful in the words that we choose:** we are a community of professionals, and we conduct ourselves professionally. Be kind to others. Do not insult or put down other participants. Harassment and other exclusionary behavior aren’t acceptable. * **Try to understand why we disagree:** Disagreements, both social and technical, happen all the time. It is important that we resolve disagreements and differing views constructively. Different people have different perspectives on issues. Being unable to understand why someone holds a viewpoint doesn’t mean that they’re wrong. Don’t forget that it is human to err and blaming each other doesn’t get us anywhere. Instead, focus on helping to resolve issues and learning from mistakes. In addition, our open source community members are expected to abide by the **[OpenPBS Acceptable Use Policy](https://openpbs.atlassian.net/wiki/spaces/PBSPro/pages/5537837/Acceptable+Use+Policy)**. 
### Reporting Issues If you experience or witness unacceptable behavior — or have any other concerns — please report it by sending e-mail to webmaster@pbspro.org. All reports will be handled with discretion. In your report please include: * Your contact information. * Names (real, nicknames, or pseudonyms) of any individuals involved. If there are additional witnesses, please include them as well. Your account of what occurred, and if you believe the incident is ongoing. If there is a publicly available record (e.g. a mailing list archive or a public IRC logger), please include a link. * Any additional information that may be helpful. After filing a report, a representative will contact you personally, review the incident, follow up with any additional questions, and make a decision as to how to respond. If the person who is harassing you is part of the response team, they will recuse themselves from handling your incident. If the complaint originates from a member of the response team, it will be handled by a different member of the response team. We will respect confidentiality requests for the purpose of protecting victims of abuse. ### Attribution & Acknowledgements This code of conduct is based on the **[Open Code of Conduct v1.0](https://github.com/todogroup/opencodeofconduct)** from the **[TODOGroup](http://todogroup.org)**. We are thankful for their work and all the communities who have paved the way with codes of conduct. ### PBS Pro Contributor's Portal Please see the PBS Pro Contributor's Portal for the PBS Pro **[Code of Conduct](https://openpbs.atlassian.net/wiki/spaces/PBSPro/pages/5537835/Code+of+Conduct)**. Note: In May 2020, OpenPBS became the new name for the PBS Professional Open Source Project. (PBS Professional will be used to refer to the commercial version; OpenPBS to the Open Source version -- same code, easier naming.) 
As there are many parts to the project, it will take several weeks to change the name in all places, so you will continue to see references to PBS Pro (as in the above) -- stay tuned. ================================================ FILE: CONTRIBUTING.md ================================================ ### Contributing to the OpenPBS Open Source Project We're so happy that you want to contribute to OpenPBS! Please see the Contributor's Portal for details, guidelines, and how-to tutorials. Start at **[Becoming a Contributor to OpenPBS](https://pbspro.atlassian.net/wiki/spaces/DG/pages/20414474/Becoming+a+Contributor+to+PBS+Pro)**. Note: In May 2020, OpenPBS became the new name for the PBS Professional Open Source Project. (PBS Professional will be used to refer to the commercial version; OpenPBS to the Open Source version -- same code, easier naming.) As there are many parts to the project, it will take several weeks to change the name in all places, so you will continue to see references to PBS Pro (as in the above) -- stay tuned. ================================================ FILE: COPYRIGHT ================================================ Copyright (C) 1994-2021 Altair Engineering, Inc. For more information, contact Altair at www.altair.com. This file is part of both the OpenPBS software ("OpenPBS") and the PBS Professional ("PBS Pro") software. Open Source License Information: OpenPBS is free software. You can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. OpenPBS is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see <https://www.gnu.org/licenses/>. 
Commercial License Information: PBS Pro is commercially licensed software that shares a common core with the OpenPBS software. For a copy of the commercial license terms and conditions, go to: (http://www.pbspro.com/agreement.html) or contact the Altair Legal Department. Altair's dual-license business model allows companies, individuals, and organizations to create proprietary derivative works of OpenPBS and distribute them - whether embedded or bundled with other software - under a commercial license agreement. Use of Altair's trademarks, including but not limited to "PBS™", "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is subject to Altair's trademark licensing policies. ================================================ FILE: INSTALL ================================================ -------------------------------------------------------------------- How to install PBS using the configure script. 0. Disable SELinux. OpenPBS does not support SELinux. With SELinux enabled, initial start fails with datastore permission error. You can also define proper policy but it is out of scope of this guide. 1. Install the prerequisite packages for building PBS. For CentOS-8 systems you should configure and enable powertools repo for hwloc-devel and libedit-devel packages. 
You should run the following commands as root: dnf install -y dnf-plugins-core dnf config-manager --set-enabled powertools dnf install -y gcc make rpm-build libtool hwloc-devel \ libX11-devel libXt-devel libedit-devel libical-devel \ ncurses-devel perl postgresql-devel postgresql-contrib python3-devel tcl-devel \ tk-devel swig expat-devel openssl-devel libXext libXft \ autoconf automake gcc-c++ cjson-devel For CentOS-7 systems you should run the following command as root: yum install -y gcc make rpm-build libtool hwloc-devel \ libX11-devel libXt-devel libedit-devel libical-devel \ ncurses-devel perl postgresql-devel postgresql-contrib python3-devel tcl-devel \ tk-devel swig expat-devel openssl-devel libXext libXft \ autoconf automake gcc-c++ For openSUSE systems you should run the following command as root: zypper install gcc make rpm-build libtool hwloc-devel \ libX11-devel libXt-devel libedit-devel libical-devel \ ncurses-devel perl postgresql-devel postgresql-contrib python3-devel tcl-devel \ tk-devel swig libexpat-devel libopenssl-devel libXext-devel \ libXft-devel fontconfig autoconf automake gcc-c++ cJSON-devel For Debian systems you should run the following command as root: apt-get install gcc make libtool libhwloc-dev libx11-dev \ libxt-dev libedit-dev libical-dev ncurses-dev perl \ postgresql-server-dev-all postgresql-contrib python3-dev tcl-dev tk-dev swig \ libexpat-dev libssl-dev libxext-dev libxft-dev autoconf \ automake g++ libcjson-dev For Ubuntu-18.04 systems you should run the following command as root: apt install gcc make libtool libhwloc-dev libx11-dev \ libxt-dev libedit-dev libical-dev ncurses-dev perl \ postgresql-server-dev-all postgresql-contrib python3-dev tcl-dev tk-dev swig \ libexpat-dev libssl-dev libxext-dev libxft-dev autoconf \ automake g++ For Ubuntu-24.04 systems you should run the following command as root: apt install gcc make libtool libhwloc-dev libx11-dev \ libxt-dev libedit-dev libical-dev ncurses-dev perl \ 
postgresql-server-dev-all postgresql-contrib python3-dev tcl-dev tk-dev swig \ libexpat-dev libssl-dev libxext-dev libxft-dev autoconf \ automake g++ libcjson-dev For macOS systems using MacPorts you should run the following command as root: port install autoconf automake libtool pkgconfig \ expat hwloc libedit libical openssl postgresql14 python310 \ swig-python tcl tk xorg-libX11 xorg-libXt 2. Install the prerequisite packages for running PBS. In addition to the commands below, you should also install a text editor of your choosing (vim, emacs, gedit, etc.). For CentOS systems you should run the following command as root: yum install -y expat libedit postgresql-server postgresql-contrib python3 \ sendmail sudo tcl tk libical chkconfig cjson For openSUSE systems you should run the following command as root: zypper install expat libedit postgresql-server postgresql-contrib python3 \ sendmail sudo tcl tk libical1 libcjson1 For Debian (jessie) systems you should run the following command as root: apt-get install expat libedit2 postgresql python3 postgresql-contrib sendmail-bin \ sudo tcl tk libical1a For Debian (stretch) systems you should run the following command as root: apt-get install expat libedit2 postgresql python3 postgresql-contrib sendmail-bin \ sudo tcl tk libical2 For Debian (buster) systems you should run the following command as root: apt-get install expat libedit2 postgresql python3 postgresql-contrib sendmail-bin \ sudo tcl tk libical3 libcjson1 For Ubuntu-18.04 systems you should run the following command as root: apt install expat libedit2 postgresql python3 postgresql-contrib sendmail-bin \ sudo tcl tk libical3 postgresql-server-dev-all For Ubuntu-24.04 systems you should run the following command as root: apt install expat libedit2 postgresql python3 postgresql-contrib sendmail-bin \ sudo tcl tk libical3 postgresql-server-dev-all For macOS systems using MacPorts you should run the following command as root: port install expat libedit libical 
openssl postgresql14-server python310 \ tcl tk 3. Open a terminal as a normal (non-root) user, unpack the PBS tarball, and cd to the package directory. tar -xpvf openpbs-20.0.0.tar.gz cd openpbs-20.0.0 4. Generate the configure script and Makefiles. (See note 1 below) ./autogen.sh 5. Display the available build parameters. ./configure --help 6. Configure the build for your environment. You may utilize the parameters displayed in the previous step. (See note 2 below) For CentOS and Debian systems you should run the following command: ./configure --prefix=/opt/pbs For openSUSE systems (see note 3 below) you should run the following command: ./configure --prefix=/opt/pbs --libexecdir=/opt/pbs/libexec For macOS systems using MacPorts you should run the following commands: export CPATH=/opt/local/include/postgresql14:/opt/local/include export LIBRARY_PATH=/opt/local/lib/postgresql14:/opt/local/lib ./configure --with-swig=/opt/local --with-tcl=/opt/local If PTL needs to be installed along with PBS use the option "--enable-ptl" (see note 5 below) eg ./configure --prefix=/opt/pbs --enable-ptl 7. Build PBS by running "make". (See note 4 below) make 8. Configure sudo to allow your user account to run commands as root. Refer to the online manual pages for sudo, sudoers, and visudo. 9. Install PBS. Use sudo to run the command as root. sudo make install 10. Configure PBS by executing the post-install script. sudo /opt/pbs/libexec/pbs_postinstall 11. Edit /etc/pbs.conf to configure the PBS services that should be started. If you are installing PBS on only one system, you should change the value of PBS_START_MOM from zero to one. If you use vi as your editor, you would run: sudo vi /etc/pbs.conf 12. Some file permissions must be modified to add SUID privilege. sudo chmod 4755 /opt/pbs/sbin/pbs_iff /opt/pbs/sbin/pbs_rcp 13. Start the PBS services. sudo /etc/init.d/pbs start 14. All configured PBS services should now be running. 
Update your PATH and MANPATH variables by sourcing the appropriate PBS profile or logging out and back in. For Bourne shell (or similar) run the following: . /etc/profile.d/pbs.sh For C shell (or similar) run the following: source /etc/profile.d/pbs.csh 15. You should now be able to run PBS commands to submit and query jobs. Some examples follow. bash$ qstat -B Server Max Tot Que Run Hld Wat Trn Ext Status ---------------- ----- ----- ----- ----- ----- ----- ----- ----- ----------- host1 0 0 0 0 0 0 0 0 Active bash$ pbsnodes -a host1 Mom = host1 ntype = PBS state = free pcpus = 2 resources_available.arch = linux resources_available.host = host1 resources_available.mem = 2049248kb resources_available.ncpus = 2 resources_available.vnode = host1 resources_assigned.accelerator_memory = 0kb resources_assigned.mem = 0kb resources_assigned.naccelerators = 0 resources_assigned.ncpus = 0 resources_assigned.vmem = 0kb resv_enable = True sharing = default_shared license = l bash$ echo "sleep 60" | qsub 0.host1 bash$ qstat -a host1: Req'd Req'd Elap Job ID Username Queue Jobname SessID NDS TSK Memory Time S Time --------------- -------- -------- ---------- ------ --- --- ------ ----- - ----- 0.host1 mike workq STDIN 2122 1 1 -- -- R 00:00 bash$ -------------------------------------------------------------------- NOTES: Note 1: If you modify configure.ac or adjust timestamps on any files that are automatically generated, you will need to regenerate them by re-running autogen.sh. Note 2: It is advisable to create a simple shell script that calls configure with the appropriate options for your environment. This ensures configure will be called with the same arguments during subsequent invocations. If you have already run configure you can regenerate all of the Makefiles by running "./config.status". The first few lines of config.status will reveal the options that were specified when configure was run. 
If you set environment variables such as CFLAGS it is best to do so as an argument to configure (e.g. ./configure CFLAGS="-O0 -g" --prefix=/opt/pbs). This will ensure consistency when config.status regenerates the Makefiles. Note 3: The openSUSE rpm package expands %_libexecdir to /opt/pbs/lib rather than /opt/pbs/libexec which causes problems for the post- install scripts. Providing the --libexecdir value to configure overrides this behavior. Note 4: You need to use a POSIX (or nearly POSIX) make. GNU make works quite well in this regard; BSD make does not. If you are having any sort of build problems, your make should be a prime suspect. Tremendous effort has been expended to provide proper dependency generation and makefiles without relying on any non-POSIX features. The build should work fine with a simple call to make, however, complicating things by using various make flags is not guaranteed to work. Don't be surprised if the first thing that make does is call configure again. Note 5: PTL gets installed in the parent directory of where PBS is installed. For example if you have given install prefix=/opt/pbs, then you can find PTL installation in the directory /opt/ptl . You may need to log out and log in from the terminal for PATH and PYTHONPATH to update. Using valgrind with PBS. ------------------------------------- Here is a set of steps to detect memory errors/leaks within PBS code. 1. Install the valgrind development package. yum install valgrind-devel (zypper for OpenSUSE). 2. Compile Python in a way that valgrind can work with it, as follows: ./configure --prefix= --without-pymalloc --with-pydebug --with-valgrind make; make install 3. Compile PBS with the special python and in debug mode as follows: ./configure --prefix= --with-python= CFLAGS="-g -DPy_DEBUG -DDEBUG -Wall -Werror" 4. Run pbs daemons under valgrind. 
a) To detect memory errors (not leaks) run pbs daemons as follows: export LD_LIBRARY_PATH=/opt/pbs/pgsql/lib:/opt/pbs/lib:$LD_LIBRARY_PATH valgrind --tool=memcheck --log-file=/tmp/val.out /opt/pbs/sbin/pbs_server.bin b) To detect memory leaks use the supplied leaks suppression file valgrind.supp, as follows: export LD_LIBRARY_PATH=/opt/pbs/pgsql/lib:/opt/pbs/lib:$LD_LIBRARY_PATH valgrind --tool=memcheck --log-file=/tmp/val.out --suppressions=./valgrind.supp --leak-check=full --track-origins=yes /opt/pbs/sbin/pbs_server.bin ================================================ FILE: LICENSE ================================================ ---------------------------------------------------- Open Source License for OpenPBS and PBS Professional ---------------------------------------------------- Copyright (C) 1994-2021 Altair Engineering, Inc. For more information, contact Altair at www.altair.com. This file is part of both the OpenPBS software ("OpenPBS") and the PBS Professional ("PBS Pro") software. Open Source License Information: OpenPBS is free software. You can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. OpenPBS is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see . Commercial License Information: PBS Pro is commercially licensed software that shares a common core with the OpenPBS software. For a copy of the commercial license terms and conditions, go to: (http://www.pbspro.com/agreement.html) or contact the Altair Legal Department. 
Altair's dual-license business model allows companies, individuals, and organizations to create proprietary derivative works of OpenPBS and distribute them - whether embedded or bundled with other software - under a commercial license agreement. Use of Altair's trademarks, including but not limited to "PBS™", "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is subject to Altair's trademark licensing policies. ============================================================================== GNU AFFERO GENERAL PUBLIC LICENSE Version 3, 19 November 2007 Copyright (C) 2007 Free Software Foundation, Inc. Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed. Preamble The GNU Affero General Public License is a free, copyleft license for software and other kinds of works, specifically designed to ensure cooperation with the community in the case of network server software. The licenses for most software and other practical works are designed to take away your freedom to share and change the works. By contrast, our General Public Licenses are intended to guarantee your freedom to share and change all versions of a program--to make sure it remains free software for all its users. When we speak of free software, we are referring to freedom, not price. Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for them if you wish), that you receive source code or can get it if you want it, that you can change the software or use pieces of it in new free programs, and that you know you can do these things. Developers that use our General Public Licenses protect your rights with two steps: (1) assert copyright on the software, and (2) offer you this License which gives you legal permission to copy, distribute and/or modify the software. 
A secondary benefit of defending all users' freedom is that improvements made in alternate versions of the program, if they receive widespread use, become available for other developers to incorporate. Many developers of free software are heartened and encouraged by the resulting cooperation. However, in the case of software used on network servers, this result may fail to come about. The GNU General Public License permits making a modified version and letting the public access it on a server without ever releasing its source code to the public. The GNU Affero General Public License is designed specifically to ensure that, in such cases, the modified source code becomes available to the community. It requires the operator of a network server to provide the source code of the modified version running there to the users of that server. Therefore, public use of a modified version, on a publicly accessible server, gives the public access to the source code of the modified version. An older license, called the Affero General Public License and published by Affero, was designed to accomplish similar goals. This is a different license, not a version of the Affero GPL, but Affero has released a new version of the Affero GPL which permits relicensing under this license. The precise terms and conditions for copying, distribution and modification follow. TERMS AND CONDITIONS 0. Definitions. "This License" refers to version 3 of the GNU Affero General Public License. "Copyright" also means copyright-like laws that apply to other kinds of works, such as semiconductor masks. "The Program" refers to any copyrightable work licensed under this License. Each licensee is addressed as "you". "Licensees" and "recipients" may be individuals or organizations. To "modify" a work means to copy from or adapt all or part of the work in a fashion requiring copyright permission, other than the making of an exact copy. 
The resulting work is called a "modified version" of the earlier work or a work "based on" the earlier work. A "covered work" means either the unmodified Program or a work based on the Program. To "propagate" a work means to do anything with it that, without permission, would make you directly or secondarily liable for infringement under applicable copyright law, except executing it on a computer or modifying a private copy. Propagation includes copying, distribution (with or without modification), making available to the public, and in some countries other activities as well. To "convey" a work means any kind of propagation that enables other parties to make or receive copies. Mere interaction with a user through a computer network, with no transfer of a copy, is not conveying. An interactive user interface displays "Appropriate Legal Notices" to the extent that it includes a convenient and prominently visible feature that (1) displays an appropriate copyright notice, and (2) tells the user that there is no warranty for the work (except to the extent that warranties are provided), that licensees may convey the work under this License, and how to view a copy of this License. If the interface presents a list of user commands or options, such as a menu, a prominent item in the list meets this criterion. 1. Source Code. The "source code" for a work means the preferred form of the work for making modifications to it. "Object code" means any non-source form of a work. A "Standard Interface" means an interface that either is an official standard defined by a recognized standards body, or, in the case of interfaces specified for a particular programming language, one that is widely used among developers working in that language. 
The "System Libraries" of an executable work include anything, other than the work as a whole, that (a) is included in the normal form of packaging a Major Component, but which is not part of that Major Component, and (b) serves only to enable use of the work with that Major Component, or to implement a Standard Interface for which an implementation is available to the public in source code form. A "Major Component", in this context, means a major essential component (kernel, window system, and so on) of the specific operating system (if any) on which the executable work runs, or a compiler used to produce the work, or an object code interpreter used to run it. The "Corresponding Source" for a work in object code form means all the source code needed to generate, install, and (for an executable work) run the object code and to modify the work, including scripts to control those activities. However, it does not include the work's System Libraries, or general-purpose tools or generally available free programs which are used unmodified in performing those activities but which are not part of the work. For example, Corresponding Source includes interface definition files associated with source files for the work, and the source code for shared libraries and dynamically linked subprograms that the work is specifically designed to require, such as by intimate data communication or control flow between those subprograms and other parts of the work. The Corresponding Source need not include anything that users can regenerate automatically from other parts of the Corresponding Source. The Corresponding Source for a work in source code form is that same work. 2. Basic Permissions. All rights granted under this License are granted for the term of copyright on the Program, and are irrevocable provided the stated conditions are met. This License explicitly affirms your unlimited permission to run the unmodified Program. 
The output from running a covered work is covered by this License only if the output, given its content, constitutes a covered work. This License acknowledges your rights of fair use or other equivalent, as provided by copyright law. You may make, run and propagate covered works that you do not convey, without conditions so long as your license otherwise remains in force. You may convey covered works to others for the sole purpose of having them make modifications exclusively for you, or provide you with facilities for running those works, provided that you comply with the terms of this License in conveying all material for which you do not control copyright. Those thus making or running the covered works for you must do so exclusively on your behalf, under your direction and control, on terms that prohibit them from making any copies of your copyrighted material outside their relationship with you. Conveying under any other circumstances is permitted solely under the conditions stated below. Sublicensing is not allowed; section 10 makes it unnecessary. 3. Protecting Users' Legal Rights From Anti-Circumvention Law. No covered work shall be deemed part of an effective technological measure under any applicable law fulfilling obligations under article 11 of the WIPO copyright treaty adopted on 20 December 1996, or similar laws prohibiting or restricting circumvention of such measures. When you convey a covered work, you waive any legal power to forbid circumvention of technological measures to the extent such circumvention is effected by exercising rights under this License with respect to the covered work, and you disclaim any intention to limit operation or modification of the work as a means of enforcing, against the work's users, your or third parties' legal rights to forbid circumvention of technological measures. 4. Conveying Verbatim Copies. 
You may convey verbatim copies of the Program's source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice; keep intact all notices stating that this License and any non-permissive terms added in accord with section 7 apply to the code; keep intact all notices of the absence of any warranty; and give all recipients a copy of this License along with the Program. You may charge any price or no price for each copy that you convey, and you may offer support or warranty protection for a fee. 5. Conveying Modified Source Versions. You may convey a work based on the Program, or the modifications to produce it from the Program, in the form of source code under the terms of section 4, provided that you also meet all of these conditions: a) The work must carry prominent notices stating that you modified it, and giving a relevant date. b) The work must carry prominent notices stating that it is released under this License and any conditions added under section 7. This requirement modifies the requirement in section 4 to "keep intact all notices". c) You must license the entire work, as a whole, under this License to anyone who comes into possession of a copy. This License will therefore apply, along with any applicable section 7 additional terms, to the whole of the work, and all its parts, regardless of how they are packaged. This License gives no permission to license the work in any other way, but it does not invalidate such permission if you have separately received it. d) If the work has interactive user interfaces, each must display Appropriate Legal Notices; however, if the Program has interactive interfaces that do not display Appropriate Legal Notices, your work need not make them do so. 
A compilation of a covered work with other separate and independent works, which are not by their nature extensions of the covered work, and which are not combined with it such as to form a larger program, in or on a volume of a storage or distribution medium, is called an "aggregate" if the compilation and its resulting copyright are not used to limit the access or legal rights of the compilation's users beyond what the individual works permit. Inclusion of a covered work in an aggregate does not cause this License to apply to the other parts of the aggregate. 6. Conveying Non-Source Forms. You may convey a covered work in object code form under the terms of sections 4 and 5, provided that you also convey the machine-readable Corresponding Source under the terms of this License, in one of these ways: a) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by the Corresponding Source fixed on a durable physical medium customarily used for software interchange. b) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by a written offer, valid for at least three years and valid for as long as you offer spare parts or customer support for that product model, to give anyone who possesses the object code either (1) a copy of the Corresponding Source for all the software in the product that is covered by this License, on a durable physical medium customarily used for software interchange, for a price no more than your reasonable cost of physically performing this conveying of source, or (2) access to copy the Corresponding Source from a network server at no charge. c) Convey individual copies of the object code with a copy of the written offer to provide the Corresponding Source. This alternative is allowed only occasionally and noncommercially, and only if you received the object code with such an offer, in accord with subsection 6b. 
d) Convey the object code by offering access from a designated place (gratis or for a charge), and offer equivalent access to the Corresponding Source in the same way through the same place at no further charge. You need not require recipients to copy the Corresponding Source along with the object code. If the place to copy the object code is a network server, the Corresponding Source may be on a different server (operated by you or a third party) that supports equivalent copying facilities, provided you maintain clear directions next to the object code saying where to find the Corresponding Source. Regardless of what server hosts the Corresponding Source, you remain obligated to ensure that it is available for as long as needed to satisfy these requirements. e) Convey the object code using peer-to-peer transmission, provided you inform other peers where the object code and Corresponding Source of the work are being offered to the general public at no charge under subsection 6d. A separable portion of the object code, whose source code is excluded from the Corresponding Source as a System Library, need not be included in conveying the object code work. A "User Product" is either (1) a "consumer product", which means any tangible personal property which is normally used for personal, family, or household purposes, or (2) anything designed or sold for incorporation into a dwelling. In determining whether a product is a consumer product, doubtful cases shall be resolved in favor of coverage. For a particular product received by a particular user, "normally used" refers to a typical or common use of that class of product, regardless of the status of the particular user or of the way in which the particular user actually uses, or expects or is expected to use, the product. 
A product is a consumer product regardless of whether the product has substantial commercial, industrial or non-consumer uses, unless such uses represent the only significant mode of use of the product. "Installation Information" for a User Product means any methods, procedures, authorization keys, or other information required to install and execute modified versions of a covered work in that User Product from a modified version of its Corresponding Source. The information must suffice to ensure that the continued functioning of the modified object code is in no case prevented or interfered with solely because modification has been made. If you convey an object code work under this section in, or with, or specifically for use in, a User Product, and the conveying occurs as part of a transaction in which the right of possession and use of the User Product is transferred to the recipient in perpetuity or for a fixed term (regardless of how the transaction is characterized), the Corresponding Source conveyed under this section must be accompanied by the Installation Information. But this requirement does not apply if neither you nor any third party retains the ability to install modified object code on the User Product (for example, the work has been installed in ROM). The requirement to provide Installation Information does not include a requirement to continue to provide support service, warranty, or updates for a work that has been modified or installed by the recipient, or for the User Product in which it has been modified or installed. Access to a network may be denied when the modification itself materially and adversely affects the operation of the network or violates the rules and protocols for communication across the network. 
Corresponding Source conveyed, and Installation Information provided, in accord with this section must be in a format that is publicly documented (and with an implementation available to the public in source code form), and must require no special password or key for unpacking, reading or copying. 7. Additional Terms. "Additional permissions" are terms that supplement the terms of this License by making exceptions from one or more of its conditions. Additional permissions that are applicable to the entire Program shall be treated as though they were included in this License, to the extent that they are valid under applicable law. If additional permissions apply only to part of the Program, that part may be used separately under those permissions, but the entire Program remains governed by this License without regard to the additional permissions. When you convey a copy of a covered work, you may at your option remove any additional permissions from that copy, or from any part of it. (Additional permissions may be written to require their own removal in certain cases when you modify the work.) You may place additional permissions on material, added by you to a covered work, for which you have or can give appropriate copyright permission. 
Notwithstanding any other provision of this License, for material you add to a covered work, you may (if authorized by the copyright holders of that material) supplement the terms of this License with terms: a) Disclaiming warranty or limiting liability differently from the terms of sections 15 and 16 of this License; or b) Requiring preservation of specified reasonable legal notices or author attributions in that material or in the Appropriate Legal Notices displayed by works containing it; or c) Prohibiting misrepresentation of the origin of that material, or requiring that modified versions of such material be marked in reasonable ways as different from the original version; or d) Limiting the use for publicity purposes of names of licensors or authors of the material; or e) Declining to grant rights under trademark law for use of some trade names, trademarks, or service marks; or f) Requiring indemnification of licensors and authors of that material by anyone who conveys the material (or modified versions of it) with contractual assumptions of liability to the recipient, for any liability that these contractual assumptions directly impose on those licensors and authors. All other non-permissive additional terms are considered "further restrictions" within the meaning of section 10. If the Program as you received it, or any part of it, contains a notice stating that it is governed by this License along with a term that is a further restriction, you may remove that term. If a license document contains a further restriction but permits relicensing or conveying under this License, you may add to a covered work material governed by the terms of that license document, provided that the further restriction does not survive such relicensing or conveying. 
If you add terms to a covered work in accord with this section, you must place, in the relevant source files, a statement of the additional terms that apply to those files, or a notice indicating where to find the applicable terms. Additional terms, permissive or non-permissive, may be stated in the form of a separately written license, or stated as exceptions; the above requirements apply either way. 8. Termination. You may not propagate or modify a covered work except as expressly provided under this License. Any attempt otherwise to propagate or modify it is void, and will automatically terminate your rights under this License (including any patent licenses granted under the third paragraph of section 11). However, if you cease all violation of this License, then your license from a particular copyright holder is reinstated (a) provisionally, unless and until the copyright holder explicitly and finally terminates your license, and (b) permanently, if the copyright holder fails to notify you of the violation by some reasonable means prior to 60 days after the cessation. Moreover, your license from a particular copyright holder is reinstated permanently if the copyright holder notifies you of the violation by some reasonable means, this is the first time you have received notice of violation of this License (for any work) from that copyright holder, and you cure the violation prior to 30 days after your receipt of the notice. Termination of your rights under this section does not terminate the licenses of parties who have received copies or rights from you under this License. If your rights have been terminated and not permanently reinstated, you do not qualify to receive new licenses for the same material under section 10. 9. Acceptance Not Required for Having Copies. You are not required to accept this License in order to receive or run a copy of the Program. 
Ancillary propagation of a covered work occurring solely as a consequence of using peer-to-peer transmission to receive a copy likewise does not require acceptance. However, nothing other than this License grants you permission to propagate or modify any covered work. These actions infringe copyright if you do not accept this License. Therefore, by modifying or propagating a covered work, you indicate your acceptance of this License to do so. 10. Automatic Licensing of Downstream Recipients. Each time you convey a covered work, the recipient automatically receives a license from the original licensors, to run, modify and propagate that work, subject to this License. You are not responsible for enforcing compliance by third parties with this License. An "entity transaction" is a transaction transferring control of an organization, or substantially all assets of one, or subdividing an organization, or merging organizations. If propagation of a covered work results from an entity transaction, each party to that transaction who receives a copy of the work also receives whatever licenses to the work the party's predecessor in interest had or could give under the previous paragraph, plus a right to possession of the Corresponding Source of the work from the predecessor in interest, if the predecessor has it or can get it with reasonable efforts. You may not impose any further restrictions on the exercise of the rights granted or affirmed under this License. For example, you may not impose a license fee, royalty, or other charge for exercise of rights granted under this License, and you may not initiate litigation (including a cross-claim or counterclaim in a lawsuit) alleging that any patent claim is infringed by making, using, selling, offering for sale, or importing the Program or any portion of it. 11. Patents. A "contributor" is a copyright holder who authorizes use under this License of the Program or a work on which the Program is based. 
The work thus licensed is called the contributor's "contributor version". A contributor's "essential patent claims" are all patent claims owned or controlled by the contributor, whether already acquired or hereafter acquired, that would be infringed by some manner, permitted by this License, of making, using, or selling its contributor version, but do not include claims that would be infringed only as a consequence of further modification of the contributor version. For purposes of this definition, "control" includes the right to grant patent sublicenses in a manner consistent with the requirements of this License. Each contributor grants you a non-exclusive, worldwide, royalty-free patent license under the contributor's essential patent claims, to make, use, sell, offer for sale, import and otherwise run, modify and propagate the contents of its contributor version. In the following three paragraphs, a "patent license" is any express agreement or commitment, however denominated, not to enforce a patent (such as an express permission to practice a patent or covenant not to sue for patent infringement). To "grant" such a patent license to a party means to make such an agreement or commitment not to enforce a patent against the party. If you convey a covered work, knowingly relying on a patent license, and the Corresponding Source of the work is not available for anyone to copy, free of charge and under the terms of this License, through a publicly available network server or other readily accessible means, then you must either (1) cause the Corresponding Source to be so available, or (2) arrange to deprive yourself of the benefit of the patent license for this particular work, or (3) arrange, in a manner consistent with the requirements of this License, to extend the patent license to downstream recipients. 
"Knowingly relying" means you have actual knowledge that, but for the patent license, your conveying the covered work in a country, or your recipient's use of the covered work in a country, would infringe one or more identifiable patents in that country that you have reason to believe are valid. If, pursuant to or in connection with a single transaction or arrangement, you convey, or propagate by procuring conveyance of, a covered work, and grant a patent license to some of the parties receiving the covered work authorizing them to use, propagate, modify or convey a specific copy of the covered work, then the patent license you grant is automatically extended to all recipients of the covered work and works based on it. A patent license is "discriminatory" if it does not include within the scope of its coverage, prohibits the exercise of, or is conditioned on the non-exercise of one or more of the rights that are specifically granted under this License. You may not convey a covered work if you are a party to an arrangement with a third party that is in the business of distributing software, under which you make payment to the third party based on the extent of your activity of conveying the work, and under which the third party grants, to any of the parties who would receive the covered work from you, a discriminatory patent license (a) in connection with copies of the covered work conveyed by you (or copies made from those copies), or (b) primarily for and in connection with specific products or compilations that contain the covered work, unless you entered into that arrangement, or that patent license was granted, prior to 28 March 2007. Nothing in this License shall be construed as excluding or limiting any implied license or other defenses to infringement that may otherwise be available to you under applicable patent law. 12. No Surrender of Others' Freedom. 
If conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License. If you cannot convey a covered work so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may not convey it at all. For example, if you agree to terms that obligate you to collect a royalty for further conveying from those to whom you convey the Program, the only way you could satisfy both those terms and this License would be to refrain entirely from conveying the Program. 13. Remote Network Interaction; Use with the GNU General Public License. Notwithstanding any other provision of this License, if you modify the Program, your modified version must prominently offer all users interacting with it remotely through a computer network (if your version supports such interaction) an opportunity to receive the Corresponding Source of your version by providing access to the Corresponding Source from a network server at no charge, through some standard or customary means of facilitating copying of software. This Corresponding Source shall include the Corresponding Source for any work covered by version 3 of the GNU General Public License that is incorporated pursuant to the following paragraph. Notwithstanding any other provision of this License, you have permission to link or combine any covered work with a work licensed under version 3 of the GNU General Public License into a single combined work, and to convey the resulting work. The terms of this License will continue to apply to the part which is the covered work, but the work with which it is combined will remain governed by version 3 of the GNU General Public License. 14. Revised Versions of this License. The Free Software Foundation may publish revised and/or new versions of the GNU Affero General Public License from time to time. 
Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns. Each version is given a distinguishing version number. If the Program specifies that a certain numbered version of the GNU Affero General Public License "or any later version" applies to it, you have the option of following the terms and conditions either of that numbered version or of any later version published by the Free Software Foundation. If the Program does not specify a version number of the GNU Affero General Public License, you may choose any version ever published by the Free Software Foundation. If the Program specifies that a proxy can decide which future versions of the GNU Affero General Public License can be used, that proxy's public statement of acceptance of a version permanently authorizes you to choose that version for the Program. Later license versions may give you additional or different permissions. However, no additional obligations are imposed on any author or copyright holder as a result of your choosing to follow a later version. 15. Disclaimer of Warranty. THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 16. Limitation of Liability. 
IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. 17. Interpretation of Sections 15 and 16. If the disclaimer of warranty and limitation of liability provided above cannot be given local legal effect according to their terms, reviewing courts shall apply local law that most closely approximates an absolute waiver of all civil liability in connection with the Program, unless a warranty or assumption of liability accompanies a copy of the Program in return for a fee. END OF TERMS AND CONDITIONS How to Apply These Terms to Your New Programs If you develop a new program, and you want it to be of the greatest possible use to the public, the best way to achieve this is to make it free software which everyone can redistribute and change under these terms. To do so, attach the following notices to the program. It is safest to attach them to the start of each source file to most effectively state the exclusion of warranty; and each file should have at least the "copyright" line and a pointer to where the full notice is found. <one line to give the program's name and a brief idea of what it does.> Copyright (C) <year> <name of author> This program is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. 
This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see <https://www.gnu.org/licenses/>. Also add information on how to contact you by electronic and paper mail. If your software can interact with users remotely through a computer network, you should also make sure that it provides a way for users to get its source. For example, if your program is a web application, its interface could display a "Source" link that leads users to an archive of the code. There are many ways you could offer source, and different solutions will be better for different programs; see section 13 for the specific requirements. You should also get your employer (if you work as a programmer) or school, if any, to sign a "copyright disclaimer" for the program, if necessary. For more information on this, and how to apply and follow the GNU AGPL, see <https://www.gnu.org/licenses/>. ============================================================================== -------------------------------- Third Party Software Information -------------------------------- PBS Pro includes code created by other parties which is provided under the open source software license agreements chosen by the authors. All unmodified files from these and other sources retain their original copyright and license notices. _ _ _ _ _ _ src/scheduler/sort.c Copyright (c) 1992, 1993. Regents of the University of California. All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 2. 
Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. 3. All advertising materials mentioning features or use of this software must display the following acknowledgement: This product includes software developed by the University of California, Berkeley and its contributors. 4. Neither the name of the University nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. _ _ _ _ _ _ src/lib/Libwin/rcmd.c Copyright (c) 1983 Regents of the University of California. All rights reserved. Redistribution and use in source and binary forms are permitted provided that the above copyright notice and this paragraph are duplicated in all such forms and that any documentation, advertising materials, and other materials related to such distribution and use acknowledge that the software was developed by the University of California, Berkeley. The name of the University may not be used to endorse or promote products derived from this software without specific prior written permission. 
THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF MERCHANTIBILITY AND FITNESS FOR A PARTICULAR PURPOSE. _ _ _ _ _ _ src/resmom/popen.c Copyright (c) 1988, 1993 The Regents of the University of California. All rights reserved. This code is derived from software written by Ken Arnold and published in UNIX Review, Vol. 6, No. 8. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. 3. All advertising materials mentioning features or use of this software must display the following acknowledgement: This product includes software developed by the University of California, Berkeley and its contributors. 4. Neither the name of the University nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. _ _ _ _ _ _ src/lib/Libutil/avltree.c Copyright (c) 2000 Gregory Tseytin All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer as the first lines of this file unmodified. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. THIS SOFTWARE IS PROVIDED BY Gregory Tseytin ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL Gregory Tseytin BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. _ _ _ _ _ _ buildutils/depcomp buildutils/compile Copyright (C) 1999-2013 Free Software Foundation, Inc. 
This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see <http://www.gnu.org/licenses/>. As a special exception to the GNU General Public License, if you distribute this file as part of a program that contains a configuration script generated by Autoconf, you may include it under the same distribution terms that you use for the rest of that program. _ _ _ _ _ _ buildutils/install-sh Copyright (C) 1994 X Consortium Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE X CONSORTIUM BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
Except as contained in this notice, the name of the X Consortium shall not be used in advertising or otherwise to promote the sale, use or other dealings in this Software without prior written authorization from the X Consortium. _ _ _ _ _ _ buildutils/ltmain.sh m4/libtool.m4 Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc. Written by Gordon Matzigkeit, 1996 This file is part of GNU Libtool. GNU Libtool is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. As a special exception to the GNU General Public License, if you distribute this file as part of a program or library that is built using GNU Libtool, you may include this file under the same distribution terms that you use for the rest of that program. GNU Libtool is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with GNU Libtool; see the file COPYING. If not, a copy can be downloaded from http://www.gnu.org/licenses/gpl.html, or obtained by writing to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. _ _ _ _ _ _ m4/lt~obsolete.m4 Copyright (C) 2004, 2005, 2007, 2009 Free Software Foundation, Inc. Written by Scott James Remnant, 2004. (see license below) m4/ltoptions.m4 Copyright (C) 2004, 2005, 2007, 2008, 2009 Free Software Foundation, Inc. Written by Gary V. Vaughan, 2004 (see license below) m4/ltsugar.m4 Copyright (C) 2004, 2005, 2007, 2008 Free Software Foundation, Inc. Written by Gary V. 
Vaughan, 2004 (see license below) m4/ltversion.m4 Copyright (C) 2004 Free Software Foundation, Inc. Written by Scott James Remnant, 2004. (see license below) m4 GNU license: License: GPL-2+ or configure-same-as-package This file is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. The full text of the GNU General Public License version 2 is available on Debian systems in /usr/share/common-licenses/GPL-2. As a special exception to the GNU General Public License, if you distribute this file as part of a program that contains a configuration script generated by Autoconf, you may include it under the same distribution terms that you use for the rest of that program. _ _ _ _ _ _ buildutils/makedepend-sh Copyright (c) 1996, 1998 The NetBSD Foundation, Inc. All rights reserved. This code is derived from software contributed to The NetBSD Foundation by Lonhyn T. Jasinskyj. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. 3. All advertising materials mentioning features or use of this software must display the following acknowledgement: This product includes software developed by the NetBSD Foundation, Inc. and its contributors. 4. 
Neither the name of The NetBSD Foundation nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. ================================================ FILE: Makefile.am ================================================ # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . 
# # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. # ACLOCAL_AMFLAGS = -I m4 SUBDIRS = buildutils src doc test EXTRA_DIST = \ COPYRIGHT \ INSTALL \ LICENSE \ README.md \ autogen.sh \ openpbs-rpmlintrc \ openpbs.spec ================================================ FILE: PBS_License.txt ================================================ Copyright (C) 1994-2021 Altair Engineering, Inc. For more information, contact Altair at www.altair.com. This file is part of both the OpenPBS software ("OpenPBS") and the PBS Professional ("PBS Pro") software. Open Source License Information: OpenPBS is free software. You can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. OpenPBS is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see . Commercial License Information: PBS Pro is commercially licensed software that shares a common core with the OpenPBS software. 
For a copy of the commercial license terms and conditions, go to: (http://www.pbspro.com/agreement.html) or contact the Altair Legal Department. Altair's dual-license business model allows companies, individuals, and organizations to create proprietary derivative works of OpenPBS and distribute them - whether embedded or bundled with other software - under a commercial license agreement. Use of Altair's trademarks, including but not limited to "PBS™", "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is subject to Altair's trademark licensing policies. ================================================ FILE: README.md ================================================ ### OpenPBS Open Source Project If you are new to this project, please start at https://www.openpbs.org/ Note: In May 2020, OpenPBS became the new name for the PBS Professional Open Source Project. (PBS Professional will be used to refer to the commercial version; OpenPBS to the Open Source version -- same code, easier naming.) As there are many parts to the project, it will take several weeks to change the name in all places, so you will continue to see references to PBS Pro -- stay tuned. ### What is OpenPBS? OpenPBS® software optimizes job scheduling and workload management in high-performance computing (HPC) environments – clusters, clouds, and supercomputers – improving system efficiency and people’s productivity. Built by HPC people for HPC people, OpenPBS is fast, scalable, secure, and resilient, and supports all modern infrastructure, middleware, and applications. 
* **Scalability:** supports millions of cores with fast job dispatch and minimal latency; tested beyond 50,000 nodes * **Policy-Driven Scheduling:** meets unique site goals and SLAs by balancing job turnaround time and utilization with optimal job placement * **Resiliency:** includes automatic fail-over architecture with no single point of failure – jobs are never lost, and jobs continue to run despite failures * **Flexible Plugin Framework:** simplifies administration with enhanced visibility and extensibility; customize implementations to meet complex requirements * **Health Checks:** monitors and automatically mitigates faults with a comprehensive health check framework * **Voted #1 HPC Software** by HPC Wire readers and proven for over 20 years at thousands of sites around the globe in both the private sector and public sector ### Community and Ways to Participate OpenPBS is a community effort and there are a variety of ways to engage, from helping answer questions to benchmarking to developing new capabilities and tests. We value being aggressively open and inclusive, but also aggressively respectful and professional. See our [Code of Conduct](https://openpbs.atlassian.net/wiki/display/PBSPro/Code+of+Conduct). The best place to start is by joining the community forum. 
You may sign up or view the archives via: * [Announcements](http://community.openpbs.org/c/announcements) -- important updates relevant to the entire PBS Pro community * [Users/Site Admins](http://community.openpbs.org/c/users-site-administrators) -- general questions and discussions among end users (system admins, engineers, scientists) * [Developers](http://community.openpbs.org/c/developers) -- technical discussions among developers To dive in deeper and learn more about the project and what the community is up to, visit: * [Contributor’s portal](https://openpbs.atlassian.net/wiki) -- includes roadmaps, processes, how to articles, coding standards, release notes, etc (Uses Confluence) * [Source code](https://github.com/OpenPBS/openpbs) -- includes full source code and test framework (Uses Github) * [Issue tracking system](https://github.com/OpenPBS/openpbs/issues) -- includes bugs and feature requests and status (Uses Github). Previously, we used [JIRA](https://pbspro.atlassian.net), which contains older issues. OpenPBS is also integrated in the OpenHPC software stack. The mission of OpenHPC is to provide an integrated collection of HPC-centric components to provide full-featured HPC software stacks. OpenHPC is a Linux Foundation Collaborative Project. Learn more at: * [OpenHPC.community](http://openhpc.community) * [The Linux Foundation](http://thelinuxfoundation.org) ### Our Vision: One Scheduler for the whole HPC World There is a huge opportunity to advance the state of the art in HPC scheduling by bringing the whole HPC world together, marrying public sector innovations with private sector enterprise know-how, and retargeting the effort wasted re-implementing the same old capabilities again and again towards pushing the outside of the envelope. At the heart of this vision is fostering common standards (at least defacto standards like common software). 
To this end, Altair has made a big investment by releasing the PBS Professional technology as OpenPBS (under an Open Source license to meet the needs of the public sector), while also continuing to offer PBS Professional (under a commercial license to meet the needs of the private sector). One defacto standard that can work for the whole HPC community. ### Current Build status [![Build Status](https://travis-ci.com/OpenPBS/openpbs.svg?branch=master)](https://travis-ci.com/OpenPBS/openpbs) ================================================ FILE: autogen.sh ================================================ #!/bin/sh # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. if test -d ./src/resmom; then echo "Generating configure script and Makefile templates." exec autoreconf --force --install -I m4 $* else echo "Execute `basename $0` from the top level distribution directory." fi ================================================ FILE: azure-pipelines.yml ================================================ trigger: branches: include: - master - release_* pr: branches: include: - master - release_* pool: vmImage: 'ubuntu-latest' # Changed from ubuntu-20.04 variables: - name: DOCKER_BUILDKIT value: 1 jobs: - job: runcheck displayName: 'Code Quality Checks' pool: vmImage: 'ubuntu-latest' steps: - checkout: self displayName: 'Checkout code' - bash: | sudo apt-get update sudo apt-get install -y python3-pip sudo pip3 install --upgrade pip sudo pip3 install pycodestyle pep8 flake8 clang-format # Create pep8 symlink if it doesn't exist (for compatibility) if ! command -v pep8 &> /dev/null; then sudo ln -sf $(which pycodestyle) /usr/local/bin/pep8 fi # Verify installations echo "Checking installed tools:" python3 --version pip3 --version pep8 --version || pycodestyle --version clang-format --version # Check if runchecks script exists if [ -f ".github/runchecks" ]; then chmod +x .github/runchecks ./.github/runchecks else echo "Warning: .github/runchecks script not found" # Run basic checks if script is missing echo "Running basic Python style checks..." find . 
-name "*.py" -exec pep8 {} \; || true fi displayName: 'Run code quality checks' - job: ubuntu_2004_build displayName: 'Ubuntu 20.04' dependsOn: runcheck pool: vmImage: 'ubuntu-latest' variables: OS_TYPE: "ubuntu:20.04" PKG_INSTALL_CMD: "apt-get -y update && apt-get -y upgrade && apt-get install -y python3 build-essential" DOCKER_EXTRA_ARG: "-e DEBIAN_FRONTEND=noninteractive -e LANGUAGE=C.UTF-8 -e LANG=C.UTF-8 -e LC_ALL=C.UTF-8" CI_CMD: "./ci --local" CONTAINER_NAME: "ubuntu2004-$(Build.BuildId)" steps: - checkout: self displayName: 'Checkout code' - script: | echo "Starting build for Ubuntu 20.04" echo "OS Type: $(OS_TYPE)" echo "Package Install: $(PKG_INSTALL_CMD)" echo "Docker Args: $(DOCKER_EXTRA_ARG)" echo "CI Command: $(CI_CMD)" echo "Container Name: $(CONTAINER_NAME)" displayName: 'Display build configuration' - script: | # Pull the Docker image docker pull $(OS_TYPE) # Start the container with proper init to handle zombie processes docker run -d \ $(DOCKER_EXTRA_ARG) \ -h pbs.dev.local \ --name $(CONTAINER_NAME) \ -v $(pwd):$(pwd) \ --privileged \ --init \ -w $(pwd) \ $(OS_TYPE) \ /bin/bash -c "sleep 3600" # Verify container is running docker ps | grep $(CONTAINER_NAME) displayName: 'Start Docker container' - script: | # Install packages docker exec $(CONTAINER_NAME) bash -c "$(PKG_INSTALL_CMD)" # Install additional tools for process management docker exec $(CONTAINER_NAME) bash -c "apt-get install -y procps psmisc" # Verify Python installation docker exec $(CONTAINER_NAME) python3 --version displayName: 'Install dependencies' - script: | # Monitor processes before running CI echo "=== Process monitoring before CI ===" docker exec $(CONTAINER_NAME) bash -c " echo 'Current processes:' ps aux | head -20 echo '' echo 'Checking for zombie/defunct processes:' ps aux | grep -E 'defunct|' || echo 'No zombie processes found' echo '' echo 'PBS-related processes:' ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found' " displayName: 'Monitor processes before 
CI' - script: | # Check if ci directory and script exist docker exec $(CONTAINER_NAME) bash -c "ls -la" docker exec $(CONTAINER_NAME) bash -c "if [ -d 'ci' ]; then ls -la ci/; else echo 'ci directory not found'; fi" # Run CI script if it exists if docker exec $(CONTAINER_NAME) bash -c "[ -f 'ci/ci' ] || [ -f './ci' ]"; then docker exec --privileged $(CONTAINER_NAME) bash -c "cd ci && $(CI_CMD)" else echo "CI script not found, running basic build test" docker exec $(CONTAINER_NAME) bash -c "python3 -c 'print(\"Python test successful\")'" fi # Check for any PBS processes and stop them properly echo "Checking for PBS processes..." docker exec $(CONTAINER_NAME) bash -c "ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found'" # Stop PBS services properly if they're running docker exec $(CONTAINER_NAME) bash -c " if command -v pbs_server &> /dev/null; then echo 'Stopping PBS services...' pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true sleep 2 # Force kill if still running pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true fi " || true displayName: 'Run CI tests' - script: | # Proper PBS cleanup and container shutdown echo "Cleaning up PBS processes and container..." # Stop PBS services gracefully first docker exec $(CONTAINER_NAME) bash -c " echo 'Stopping PBS services gracefully...' 
if command -v qterm &> /dev/null; then qterm -t quick || true fi # Stop individual PBS components pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true # Wait a bit for graceful shutdown sleep 3 # Force kill any remaining PBS processes pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true # Clean up any remaining zombie processes ps aux | grep -E 'defunct|' || echo 'No zombie processes found' " || true # Stop and remove container docker stop $(CONTAINER_NAME) || true docker rm $(CONTAINER_NAME) || true displayName: 'Cleanup Docker container' condition: always() - job: ubuntu_2404_build displayName: 'Ubuntu 24.04' dependsOn: runcheck pool: vmImage: 'ubuntu-latest' variables: OS_TYPE: "ubuntu:24.04" PKG_INSTALL_CMD: "apt-get -y update && apt-get -y upgrade && apt-get install -y python3 build-essential" DOCKER_EXTRA_ARG: "-e DEBIAN_FRONTEND=noninteractive -e LANGUAGE=C.UTF-8 -e LANG=C.UTF-8 -e LC_ALL=C.UTF-8" CI_CMD: "./ci --local" CONTAINER_NAME: "ubuntu2404-$(Build.BuildId)" steps: - checkout: self displayName: 'Checkout code' - script: | echo "Starting build for Ubuntu 24.04" echo "OS Type: $(OS_TYPE)" echo "Package Install: $(PKG_INSTALL_CMD)" echo "Docker Args: $(DOCKER_EXTRA_ARG)" echo "CI Command: $(CI_CMD)" echo "Container Name: $(CONTAINER_NAME)" displayName: 'Display build configuration' - script: | # Pull the Docker image docker pull $(OS_TYPE) # Start the container with proper init to handle zombie processes docker run -d \ $(DOCKER_EXTRA_ARG) \ -h pbs.dev.local \ --name $(CONTAINER_NAME) \ -v $(pwd):$(pwd) \ --privileged \ --init \ -w $(pwd) \ $(OS_TYPE) \ /bin/bash -c "sleep 3600" # Verify container is running docker ps | grep $(CONTAINER_NAME) displayName: 'Start Docker container' - script: | # Install packages docker exec $(CONTAINER_NAME) bash -c "$(PKG_INSTALL_CMD)" # Install additional tools for process 
management docker exec $(CONTAINER_NAME) bash -c "apt-get install -y procps psmisc" # Verify Python installation docker exec $(CONTAINER_NAME) python3 --version displayName: 'Install dependencies' - script: | # Monitor processes before running CI echo "=== Process monitoring before CI ===" docker exec $(CONTAINER_NAME) bash -c " echo 'Current processes:' ps aux | head -20 echo '' echo 'Checking for zombie/defunct processes:' ps aux | grep -E 'defunct|' || echo 'No zombie processes found' echo '' echo 'PBS-related processes:' ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found' " displayName: 'Monitor processes before CI' - script: | # Check if ci directory and script exist docker exec $(CONTAINER_NAME) bash -c "ls -la" docker exec $(CONTAINER_NAME) bash -c "if [ -d 'ci' ]; then ls -la ci/; else echo 'ci directory not found'; fi" # Run CI script if it exists if docker exec $(CONTAINER_NAME) bash -c "[ -f 'ci/ci' ] || [ -f './ci' ]"; then docker exec --privileged $(CONTAINER_NAME) bash -c "cd ci && $(CI_CMD)" else echo "CI script not found, running basic build test" docker exec $(CONTAINER_NAME) bash -c "python3 -c 'print(\"Python test successful\")'" fi # Check for any PBS processes and stop them properly echo "Checking for PBS processes..." docker exec $(CONTAINER_NAME) bash -c "ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found'" # Stop PBS services properly if they're running docker exec $(CONTAINER_NAME) bash -c " if command -v pbs_server &> /dev/null; then echo 'Stopping PBS services...' pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true sleep 2 # Force kill if still running pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true fi " || true displayName: 'Run CI tests' - script: | # Proper PBS cleanup and container shutdown echo "Cleaning up PBS processes and container..." 
# Stop PBS services gracefully first docker exec $(CONTAINER_NAME) bash -c " echo 'Stopping PBS services gracefully...' if command -v qterm &> /dev/null; then qterm -t quick || true fi # Stop individual PBS components pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true # Wait a bit for graceful shutdown sleep 3 # Force kill any remaining PBS processes pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true # Clean up any remaining zombie processes ps aux | grep -E 'defunct|' || echo 'No zombie processes found' " || true # Stop and remove container docker stop $(CONTAINER_NAME) || true docker rm $(CONTAINER_NAME) || true displayName: 'Cleanup Docker container' condition: always() - job: rocky_sanitize_build displayName: 'Rocky Linux 9 Sanitize' dependsOn: runcheck pool: vmImage: 'ubuntu-latest' variables: OS_TYPE: "rockylinux/rockylinux:9.2" PKG_INSTALL_CMD: "yum -y update && yum -y install python3 gcc gcc-c++ make" DOCKER_EXTRA_ARG: "-e BUILD_MODE=sanitize" CI_CMD: "./ci --local=sanitize" CONTAINER_NAME: "rocky-sanitize-$(Build.BuildId)" steps: - checkout: self displayName: 'Checkout code' - script: | echo "Starting build for Rocky Linux 9 Sanitize" echo "OS Type: $(OS_TYPE)" echo "Package Install: $(PKG_INSTALL_CMD)" echo "Docker Args: $(DOCKER_EXTRA_ARG)" echo "CI Command: $(CI_CMD)" echo "Container Name: $(CONTAINER_NAME)" displayName: 'Display build configuration' - script: | # Pull the Docker image docker pull $(OS_TYPE) # Start the container with proper init to handle zombie processes docker run -d \ $(DOCKER_EXTRA_ARG) \ -h pbs.dev.local \ --name $(CONTAINER_NAME) \ -v $(pwd):$(pwd) \ --privileged \ --init \ -w $(pwd) \ $(OS_TYPE) \ /bin/bash -c "sleep 3600" # Verify container is running docker ps | grep $(CONTAINER_NAME) displayName: 'Start Docker container' - script: | # Install packages docker exec $(CONTAINER_NAME) 
bash -c "$(PKG_INSTALL_CMD)" # Install additional tools for process management docker exec $(CONTAINER_NAME) bash -c "yum install -y procps-ng psmisc || dnf install -y procps-ng psmisc" # Verify Python installation docker exec $(CONTAINER_NAME) python3 --version displayName: 'Install dependencies' - script: | # Monitor processes before running CI echo "=== Process monitoring before CI ===" docker exec $(CONTAINER_NAME) bash -c " echo 'Current processes:' ps aux | head -20 echo '' echo 'Checking for zombie/defunct processes:' ps aux | grep -E 'defunct|' || echo 'No zombie processes found' echo '' echo 'PBS-related processes:' ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found' " displayName: 'Monitor processes before CI' - script: | # Check if ci directory and script exist docker exec $(CONTAINER_NAME) bash -c "ls -la" docker exec $(CONTAINER_NAME) bash -c "if [ -d 'ci' ]; then ls -la ci/; else echo 'ci directory not found'; fi" # Run CI script if it exists if docker exec $(CONTAINER_NAME) bash -c "[ -f 'ci/ci' ] || [ -f './ci' ]"; then docker exec --privileged $(CONTAINER_NAME) bash -c "cd ci && $(CI_CMD)" else echo "CI script not found, running basic build test" docker exec $(CONTAINER_NAME) bash -c "python3 -c 'print(\"Python test successful\")'" fi # Check for any PBS processes and stop them properly echo "Checking for PBS processes..." docker exec $(CONTAINER_NAME) bash -c "ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found'" # Stop PBS services properly if they're running docker exec $(CONTAINER_NAME) bash -c " if command -v pbs_server &> /dev/null; then echo 'Stopping PBS services...' 
pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true sleep 2 # Force kill if still running pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true fi " || true displayName: 'Run CI tests' - script: | # Proper PBS cleanup and container shutdown echo "Cleaning up PBS processes and container..." # Stop PBS services gracefully first docker exec $(CONTAINER_NAME) bash -c " echo 'Stopping PBS services gracefully...' if command -v qterm &> /dev/null; then qterm -t quick || true fi # Stop individual PBS components pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true # Wait a bit for graceful shutdown sleep 3 # Force kill any remaining PBS processes pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true # Clean up any remaining zombie processes ps aux | grep -E 'defunct|' || echo 'No zombie processes found' " || true # Stop and remove container docker stop $(CONTAINER_NAME) || true docker rm $(CONTAINER_NAME) || true displayName: 'Cleanup Docker container' condition: always() - job: rocky_kerberos_build displayName: 'Rocky Linux 9 Kerberos' dependsOn: runcheck pool: vmImage: 'ubuntu-latest' variables: OS_TYPE: "rockylinux/rockylinux:9.2" PKG_INSTALL_CMD: "yum -y update && yum -y install python3 gcc gcc-c++ make" DOCKER_EXTRA_ARG: "-e BUILD_MODE=kerberos" CI_CMD: "./ci --local" CONTAINER_NAME: "rocky-kerberos-$(Build.BuildId)" steps: - checkout: self displayName: 'Checkout code' - script: | echo "Starting build for Rocky Linux 9 Kerberos" echo "OS Type: $(OS_TYPE)" echo "Package Install: $(PKG_INSTALL_CMD)" echo "Docker Args: $(DOCKER_EXTRA_ARG)" echo "CI Command: $(CI_CMD)" echo "Container Name: $(CONTAINER_NAME)" displayName: 'Display build configuration' - script: | # Pull the Docker image docker 
pull $(OS_TYPE) # Start the container with proper init to handle zombie processes docker run -d \ $(DOCKER_EXTRA_ARG) \ -h pbs.dev.local \ --name $(CONTAINER_NAME) \ -v $(pwd):$(pwd) \ --privileged \ --init \ -w $(pwd) \ $(OS_TYPE) \ /bin/bash -c "sleep 3600" # Verify container is running docker ps | grep $(CONTAINER_NAME) displayName: 'Start Docker container' - script: | # Install packages docker exec $(CONTAINER_NAME) bash -c "$(PKG_INSTALL_CMD)" # Install additional tools for process management docker exec $(CONTAINER_NAME) bash -c "yum install -y procps-ng psmisc || dnf install -y procps-ng psmisc" # Verify Python installation docker exec $(CONTAINER_NAME) python3 --version displayName: 'Install dependencies' - script: | # Monitor processes before running CI echo "=== Process monitoring before CI ===" docker exec $(CONTAINER_NAME) bash -c " echo 'Current processes:' ps aux | head -20 echo '' echo 'Checking for zombie/defunct processes:' ps aux | grep -E 'defunct|' || echo 'No zombie processes found' echo '' echo 'PBS-related processes:' ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found' " displayName: 'Monitor processes before CI' - script: | # Check if ci directory and script exist docker exec $(CONTAINER_NAME) bash -c "ls -la" docker exec $(CONTAINER_NAME) bash -c "if [ -d 'ci' ]; then ls -la ci/; else echo 'ci directory not found'; fi" # Run CI script if it exists if docker exec $(CONTAINER_NAME) bash -c "[ -f 'ci/ci' ] || [ -f './ci' ]"; then docker exec --privileged $(CONTAINER_NAME) bash -c "cd ci && $(CI_CMD)" else echo "CI script not found, running basic build test" docker exec $(CONTAINER_NAME) bash -c "python3 -c 'print(\"Python test successful\")'" fi # Check for any PBS processes and stop them properly echo "Checking for PBS processes..." 
docker exec $(CONTAINER_NAME) bash -c "ps aux | grep -E 'pbs_|openpbs' || echo 'No PBS processes found'" # Stop PBS services properly if they're running docker exec $(CONTAINER_NAME) bash -c " if command -v pbs_server &> /dev/null; then echo 'Stopping PBS services...' pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true sleep 2 # Force kill if still running pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true fi " || true displayName: 'Run CI tests' - script: | # Proper PBS cleanup and container shutdown echo "Cleaning up PBS processes and container..." # Stop PBS services gracefully first docker exec $(CONTAINER_NAME) bash -c " echo 'Stopping PBS services gracefully...' if command -v qterm &> /dev/null; then qterm -t quick || true fi # Stop individual PBS components pkill -TERM pbs_server || true pkill -TERM pbs_sched || true pkill -TERM pbs_mom || true pkill -TERM pbs_ds_monitor || true # Wait a bit for graceful shutdown sleep 3 # Force kill any remaining PBS processes pkill -KILL pbs_server || true pkill -KILL pbs_sched || true pkill -KILL pbs_mom || true pkill -KILL pbs_ds_monitor || true # Clean up any remaining zombie processes ps aux | grep -E 'defunct|' || echo 'No zombie processes found' " || true # Stop and remove container docker stop $(CONTAINER_NAME) || true docker rm $(CONTAINER_NAME) || true displayName: 'Cleanup Docker container' condition: always() ================================================ FILE: buildutils/Makefile.am ================================================ # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. # EXTRA_DIST = \ attr_parser.py ================================================ FILE: buildutils/attr_parser.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
""" attr_parser.py will parse xml files also called master attribute files containing all the members of both server and ecl files,and will generate two corresponding files one for server and one for ecl """ import getopt import os import pdb import re import string import sys import enum import xml.dom.minidom import xml.parsers.expat list_ecl = [] list_svr = [] list_defs = [] global attr_type global newattr class PropType(enum.Enum): ''' BOTH - Write information for this tag to all the output files SERVER - Write information for this tag to the SERVER file only ECL - Write information for this tag to the ECL file only ''' BOTH = 0 SERVER = 1 ECL = 2 class switch(object): """ This class provides the functionality which is equivalent to switch/case statements in C. It only needs to be defined once. """ def __init__(self, value): self.value = value self.fall = False def __iter__(self): """Return the match method once, then stop""" yield self.match def match(self, *args): """Indicate whether or not to enter a case suite""" if self.fall or not args: return True elif self.value in args: # changed for v1.5, see below self.fall = True return True else: return False def fileappend(prop_type, line): ''' Selects files to append line to dependig on prop_type prop_type - BOTH, SERVER, ECL line - The string line to append to the file(s) ''' global attr_type if prop_type == PropType.SERVER: if attr_type == PropType.SERVER or attr_type == PropType.BOTH: list_svr.append(line) elif prop_type == PropType.ECL: if attr_type == PropType.ECL or attr_type == PropType.BOTH: list_ecl.append(line) elif prop_type == PropType.BOTH: if attr_type == PropType.SERVER or attr_type == PropType.BOTH: list_svr.append(line) if attr_type == PropType.ECL or attr_type == PropType.BOTH: list_ecl.append(line) return None def getText(svr_file, ecl_file, defines_file): ''' getText function - (writes the data stored in lists to file) svr_file - the server side output file ecl_file - the output file to be 
used by the ECL layer defines_file - the output file containing the macro definitions for the index positions ''' buff = "".join(list_svr) for line in buff: svr_file.write(line) buff = "".join(list_ecl) for line in buff: ecl_file.write(line) buff = "".join(list_defs) for line in buff: defines_file.write(line) def do_head(node): ''' Processes the head element of the node passed ''' alist = node.getElementsByTagName('head') for a in alist: list_svr.append("/*Disclaimer: This is a machine generated file.*/" + '\n') list_svr.append("/*For modifying any attribute change corresponding " "XML file */" + '\n') list_ecl.append("/*Disclaimer: This is a machine generated file.*/" + '\n') list_ecl.append("/*For modifying any attribute change corresponding " "XML file */" + '\n') blist = a.getElementsByTagName('SVR') blist_ecl = a.getElementsByTagName('ECL') for s in blist: text1 = s.childNodes[0].nodeValue text1 = text1.strip(' \t') list_svr.append(text1) for e in blist_ecl: text2 = e.childNodes[0].nodeValue text2 = text2.strip(' \t') list_ecl.append(text2) def do_index(attr): ''' Processes the member_index attribute attr ''' li = None li = attr.getElementsByTagName('member_index') if li: for v in li: buf = v.childNodes[0].nodeValue list_defs.append("\n\t" + buf + ",") def do_member(attr, p_flag, tag_name): ''' Processes the member identified by tage_name attr - the attribute definition node p_flag - property flag - SVR, ECL, BOTH tag_name - the tag_name string to process ''' global newattr buf = None comma = ',' if newattr: comma = '' newattr = False li = attr.getElementsByTagName(tag_name) if li: svr = li[0].getElementsByTagName('SVR') if svr: value = svr for v in value: buf = v.childNodes[0].nodeValue fileappend(PropType.SERVER, comma + '\n' + '\t' + '\t' + buf) ecl = li[0].getElementsByTagName('ECL') if ecl: value = ecl for v in value: buf = v.childNodes[0].nodeValue fileappend(PropType.ECL, comma + '\n' + '\t' + '\t' + buf) value = li for v in value: buf = 
v.childNodes[0].nodeValue if buf: s = buf.strip('\n \t') if s: fileappend(p_flag, comma + '\n' + '\t' + '\t' + buf) def process(master_file, svr_file, ecl_file, defines_file): ''' process the master xml file and produce the outputs files as requested master_file - the Master XML files to process svr_file - the server side output file ecl_file - the output file to be used by the ECL layer defines_file - the output file containing the macro definitions for the index positions ''' from xml.dom import minidom global attr_type global newattr newattr = False doc = minidom.parse(master_file) nodes = doc.getElementsByTagName('data') for node in nodes: do_head(node) at_list = node.getElementsByTagName('attributes') for attr in at_list: attr_type = PropType.BOTH newattr = True flag_name = attr.getAttribute('flag') if flag_name == 'SVR': attr_type = PropType.SERVER if flag_name == 'ECL': attr_type = PropType.ECL inc_name = attr.getAttribute('include') if inc_name: fileappend(PropType.SERVER, '\n' + inc_name) mem_list = attr.childNodes[0].nodeValue mem_list = mem_list.strip(' \t') fileappend(PropType.BOTH, mem_list) macro_name = attr.getAttribute('macro') if macro_name: fileappend(PropType.BOTH, '\n' + macro_name + "\n") do_index(attr) fileappend(PropType.BOTH, '\t{') do_member(attr, PropType.BOTH, 'member_name') do_member(attr, PropType.SERVER, 'member_at_decode') do_member(attr, PropType.SERVER, 'member_at_encode') do_member(attr, PropType.SERVER, 'member_at_set') do_member(attr, PropType.SERVER, 'member_at_comp') do_member(attr, PropType.SERVER, 'member_at_free') do_member(attr, PropType.SERVER, 'member_at_action') do_member(attr, PropType.BOTH, 'member_at_flags') do_member(attr, PropType.BOTH, 'member_at_type') do_member(attr, PropType.SERVER, 'member_at_parent') do_member(attr, PropType.ECL, 'member_verify_function') do_member(attr, PropType.SERVER, 'member_at_entlim') do_member(attr, PropType.SERVER, 'member_at_struct') fileappend(PropType.BOTH, '\n\t}') 
fileappend(PropType.BOTH, ",") if macro_name: fileappend(PropType.BOTH, '\n#else') fileappend(PropType.BOTH, '\n\t{\n\t\t"noop"\n\t},') fileappend(PropType.BOTH, '\n#endif') tail_list = node.getElementsByTagName('tail') for t in tail_list: tail_value = t.childNodes[0].nodeValue if tail_value is None: pass fileappend(PropType.BOTH, '\n') tail_both = t.getElementsByTagName('both') tail_svr = t.getElementsByTagName('SVR') tail_ecl = t.getElementsByTagName('ECL') for tb in tail_both: b = tb.childNodes[0].nodeValue b = b.strip(' \t') list_ecl.append(b) list_svr.append(b) for ts in tail_svr: s = ts.childNodes[0].nodeValue s = s.strip(' \t') list_svr.append(s) for te in tail_ecl: e = te.childNodes[0].nodeValue e = e.strip(' \t') list_ecl.append(e) getText(svr_file, ecl_file, defines_file) def main(argv): ''' Opens files,and calls appropriate functions based on Object values. ''' global SVR_FILENAME global ECL_FILENAME global DEFINES_FILENAME global MASTER_FILENAME SVR_FILENAME = "/dev/null" ECL_FILENAME = "/dev/null" DEFINES_FILENAME = "/dev/null" MASTER_FILENAME = "/dev/null" if len(sys.argv) == 2: usage() sys.exit(1) try: opts, args = getopt.getopt( argv, "m:s:e:d:h", ["master=", "svr=", "ecl=", "attr=", "help=", "defines="]) except getopt.error as err: print(str(err)) usage() sys.exit(1) for opt, arg in opts: if opt in ('-h', "--help"): usage() sys.exit(1) elif opt in ("-m", "--master"): MASTER_FILENAME = arg elif opt in ("-s", "--svr"): SVR_FILENAME = arg elif opt in ("-d", "--defines"): DEFINES_FILENAME = arg elif opt in ("-e", "--ecl"): ECL_FILENAME = arg else: print("Invalid Option!") sys.exit(1) # Error conditions are checked here. 
if (MASTER_FILENAME is None or not os.path.isfile(MASTER_FILENAME) or not os.path.getsize(MASTER_FILENAME) > 0): print("Master file not found or data is not present in File") sys.exit(1) try: master_file = open(MASTER_FILENAME, encoding='utf-8') except IOError as err: print(str(err)) print('Cannot open master file ' + MASTER_FILENAME) sys.exit(1) try: svr_file = open(SVR_FILENAME, 'w', encoding='utf-8') except IOError as err: print(str(err)) print('Cannot open ferver file ' + SVR_FILENAME) sys.exit(1) try: defines_file = open(DEFINES_FILENAME, 'w', encoding='utf-8') except IOError as err: print(str(err)) print('Cannot open defines file ' + DEFINES_FILENAME) sys.exit(1) try: ecl_file = open(ECL_FILENAME, 'w', encoding='utf-8') except IOError as err: print(str(err)) print('Cannot open ecl file ' + ECL_FILENAME) sys.exit(1) process(master_file, svr_file, ecl_file, defines_file) master_file.close() svr_file.close() ecl_file.close() def usage(): """ Usage (depicts the usage of the script) """ print("usage: prog -m -s " "-e -d ") if __name__ == "__main__": main(sys.argv[1:]) ================================================ FILE: ci/README.md ================================================ Instant-CI is a developer tool which aims at providing continous integration to the developers locally on their development systems. Users can build, install PBS and run PTL tests with a single command. For this, the user need not worry about any underlying dependencies. It also supports build and test history in the form of logs. Dependencies for this tool are: * python3.5 or above * docker (17.12.0+) * docker-compose ***How to setup:*** Simply invoke the following command: ` ./ci` ***CLI interface for ci:*** * **./ci :** This is the primary command for ci. It starts the container (if not already running), builds PBS dependencies. Will configure(if required), make and install PBS. If the tests option are given it will run PTL with the same. It does not take any argument. 
```bash ./ci ``` * **./ci --params:** The params option can be used to run ci with a custom configuration. Following parameters can be set. | os | nodes | configure | tests | > os: used to set OS platform of the container (single node)
> nodes: used to define multi-node configuration for container
> configure: will hold the value of configure options for PBS
> tests: holds the pbs_benchpress arguments for PTL; if set to empty, PTL tests are skipped
```bash
# When the params command is called without any arguments it will display the currently set "configuration" and then proceed to run ci
# as in the following example.
./ci --params
# or
./ci -p
# The following command is an example of how to provide a custom configure option for PBS. Everything to the right of the first '=' after configure will
# be taken as it is and given as an argument to the configure file in PBS. The same convention follows for other configuration options as well
./ci --params 'configure=CFLAGS=" -O2 -Wall -Werror" --prefix=/tmp/pbs --enable-ptl'
# You can also pass multiple parameters with this option, for example
./ci -p 'configure=--enable-ptl --prefix=/opt/pbs' -p 'tests=-t SmokeTest.test_basic'
# The following are examples of how to define a custom test case for pbs_benchpress.
# NOTE: The string is passed to the pbs_benchpress command, therefore one can use all available options of pbs_benchpress here.
# By default the test option is set to '-t SmokeTest'
./ci --params 'tests=-f pbs_smoketest.py'
./ci --params 'tests=--tags=smoke'
# If you wish to not run any PTL tests then use the below command. This will set tests as empty thus not invoking PTL.
./ci --params 'tests='
# Below is an example of setting the container operating system. This will setup a single container running PBS server.
# NOTE: ci uses cached images to increase performance. These cached images are saved on the local system
# with the suffix '-ci-pbs'. If you do not wish to use the cached image(s), delete them using `docker rmi <image name>`.
# OS platform can be defined by any image from docker-hub
./ci --params 'os=centos:7'
# Following is an example of how to define a multi node setup for PBS.
# You can define multiple 'mom' or 'comm' nodes but only one 'server' node
./ci --params 'nodes=mom=centos:7;server=ubuntu:16.04;comm=ubuntu:18.04;mom=centos:8'
```
* **./ci --build-pkgs:** Invoke this command to build PBS packages. By default it will build packages for the platform the ci container is started for.
Optionally accepts argument for other platform. The packages can be found in 'ci/packages' folder. ```bash # Below command builds package for the platform ci was started/currently running on. ./ci --build-pkgs # or ./ci -b ``` * **./ci --delete:** This will delete any containers created by this tool and take a backup of logs. The current logs can be found in the "logs" folder in the ci folder. The backup of previous sessions logs can be can be found in the ci/logs/session-{date}-{timestamp} folder. ```bash # If you want to delete the container simply invoke this command. ./ci --delete # or ./ci -d ``` * **./ci --local:** This will build, install PBS, and run smoke tests on the local machine. This option can not be combined with other options. It does not take configurations from params but runs with predefined params(as run in travis). ```bash # The command to run ./ci --local #or ./ci -l # Optionally one can run the sanitize version (works only on centos:7) with the following argument ./ci --local sanitize ``` ================================================ FILE: ci/ci ================================================ #!/usr/bin/env python3 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. 
# # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. import argparse import configparser import copy import fileinput import json import os import platform import re import shlex import shutil import subprocess import sys import textwrap import threading import time from argparse import RawTextHelpFormatter from string import Template ci_dirname = '' default_platform = '' MACROS = {} def read_macros(): for line in open(os.path.join(ci_dirname, 'etc', 'macros')): var, value = line.split('=') MACROS[var] = value.replace('\n', '') requirements_template = Template('''num_servers=${num_servers} num_moms=${num_moms} num_comms=${num_comms} no_mom_on_server=${no_mom_on_server} no_comm_on_server=${no_comm_on_server} no_comm_on_mom=${no_comm_on_mom} ''') service_template_prist = Template('''{ "image": "${image}", "volumes": [ "../:/pbssrc", "./:/src", "./logs:/logs", "./etc:/workspace/etc" ], "entrypoint": "/workspace/etc/container-init", "environment": [ "NODE_TYPE=${node_type}", "LANG=en_US.utf-8" ], "networks": { "ci.local": { } }, "domainname": "ci.local", "container_name": "${hostname}", "hostname": "${hostname}", "user": "root", "privileged": true, "stdin_open": true, "tty": true 
}''') def log_error(msg): print("ERROR ::: " + str(msg)) def log_info(msg): t = time.localtime() current_time = time.strftime("%H:%M:%S", t) print(current_time + " ---> " + str(msg)) def log_warning(msg): print("WARNING ::: " + str(msg)) def get_services_list(): _ps = subprocess.run( ["docker-compose", "-f", "docker-compose.json", "ps", "--filter", "status=running", "--services"], stdout=subprocess.PIPE) _p = str((_ps.stdout).decode('utf-8')) return [x for x in _p.splitlines() if len(x) > 0] def get_compose_file_services_list(): compose_file = os.path.join(ci_dirname, 'docker-compose.json') with open(compose_file) as f: compose_file = json.loads(f.read()) return list(compose_file['services'].keys()) def run_cmd(cmd, return_output=False): ''' Run a terminal command, and if needed return output of the command. ''' cmd = shlex.split(cmd) try: a = subprocess.Popen(cmd, stdout=subprocess.PIPE) out, err = a.communicate() if a.returncode != 0: log_error("command failed") log_error(str(err)) else: if return_output: return str(out) except Exception as e: log_error("The command failed.") log_error(e) def run_docker_cmd(run_cmd, run_on='all'): ''' Runs a docker command and on failure redirects user to the container terminal ''' services = get_services_list() services.sort(reverse=True) # we want server cmds to run first for service in services: cmd = "docker-compose -f docker-compose.json exec " cmd += service + " bash -c \'" + run_cmd + "\'" if run_on != 'all' and service.find(run_on) == -1: log_info('Skipping on ' + service + ' as command only to be run on ' + run_on) continue try: log_info(cmd) docker_cmd = shlex.split(cmd) a = subprocess.Popen(docker_cmd) a.communicate() if a.returncode != 0: _msg = "docker cmd returned with non zero exit code," _msg += "redirecting you to container terminal" log_error(_msg) _docker_cmd = "docker-compose -f docker-compose.json exec " _docker_cmd += service + " bash -c \'cd /pbssrc && /bin/bash\'" docker_cmd = shlex.split(_docker_cmd) 
        subprocess.run(docker_cmd)
        os._exit(1)
    except Exception as e:
        log_error("Failed\n:")
        log_error(e)


def write_to_file(file_path, value):
    '''
    Overwrite file_path with the given string value (file is created
    if it does not exist).
    '''
    with open(file_path, "w+") as f:
        f.write(value)


def read_from_file(file_path):
    '''
    Return the full contents of file_path as a string; creates an
    empty file first when it does not exist yet.
    '''
    if not os.path.isfile(file_path):
        open(file_path, 'a').close()
    with open(file_path, 'r+') as f:
        val = f.read()
    return val


def commit_docker_image():
    '''
    Watch for readiness of ci containers to commit a new image
    '''
    images_to_commit = {}
    time_spent = 0
    services = get_services_list()
    service_count = len(services)
    # overall readiness timeout: one hour
    timeout = 1 * 60 * 60
    while service_count > 0:
        # Do not want to check constantly as it increases cpu load
        time.sleep(15)
        time_spent = time_spent + 15
        if time_spent > timeout:
            log_error("build is taking too long, timed out")
            sys.exit(1)
        # the status file accumulates the names of services that finished
        status = read_from_file(os.path.join(
            ci_dirname, MACROS['CONFIG_DIR'], MACROS['STATUS_FILE']))
        for service in services:
            if str(status).find(service) != -1:
                # NOTE(review): removes from `services` while iterating it —
                # may skip the element after the removed one on this pass;
                # it is re-scanned on the next poll, so progress still happens.
                services.remove(service)
                service_count -= 1
                # service name is '<type>-<image-with-dashes>-<count>';
                # recover 'image:tag' from the middle portion
                image = (service.split('-', 1)[1][:-2]).replace('-', ':')
                image = image.replace("_", ".")
                images_to_commit[image] = service
    for key in images_to_commit:
        try:
            build_id = 'docker-compose -f docker-compose.json ps -q ' + \
                images_to_commit[key]
            build_id = run_cmd(build_id, True)
            # run_cmd(..., True) returns the repr of a bytes object ("b'...'"),
            # so the payload sits between the single quotes
            build_id = build_id.split("'")[1]
            build_id = build_id[:12]
            image_name = (str(key).replace(':', '-')
                          ).replace('.', '_') + '-ci-pbs'
            # shortening the build id to 12 characters as is displayed by
            # 'docker ps' unlike 'docker-compose ps' which shows full id
            cmd = 'docker commit '+build_id+' '+image_name+':latest'
            log_info(cmd)
            run_cmd(cmd)
        except Exception as e:
            log_error(e)
    try:
        # clean up untagged (dangling) layers left behind by the commit
        bad_images = "docker images -qa -f'dangling=true'"
        bad_images = run_cmd(bad_images, True)
        if bad_images != "b''":
            bad_images = (bad_images.split("'")[1]).replace("\\n", " ")
            print("The following untagged images will be removed -> " +
                  bad_images)
            cmd = 'docker rmi ' + bad_images
            run_cmd(cmd)
    except Exception as e:
        log_warning(
            "could not remove bad (dangling) images, \
please remove manually")
        print(e)
    return True


def create_ts_tree_json():
    '''
    Generate the PTL testsuite info json (ptl_ts_tree.json) inside the
    server container for the currently configured benchpress options.
    '''
    benchpress_opt = os.path.join(
        ci_dirname, MACROS['CONFIG_DIR'], MACROS['BENCHPRESS_OPT_FILE'])
    benchpress_value = read_from_file(benchpress_opt)
    try:
        cmd = '/src/etc/gen_ptl_json.sh "' + benchpress_value + '"'
        run_docker_cmd(cmd, run_on='server')
    except Exception:
        log_error('Failed to generate testsuite info json')
        sys.exit(1)


def get_node_config(node_image=default_platform):
    '''
    Calculate the required node configuration for given
    requirements decorator and return node config
    '''
    json_data = {}
    max_servers_needed = 1
    max_moms_needed = 1
    max_comms_needed = 1
    no_mom_on_server_flag = False
    no_comm_on_mom_flag = True
    no_comm_on_server_flag = False
    try:
        with open(os.path.join(ci_dirname, 'ptl_ts_tree.json')) as f:
            json_data = json.load(f)
    except Exception:
        log_error('Could not find ptl tree json file')
    # take the maximum of every requirement across all selected test cases
    for ts in json_data.values():
        for tclist in ts['tclist'].values():
            max_moms_needed = max(
                tclist['requirements']['num_moms'], max_moms_needed)
            max_servers_needed = max(
                tclist['requirements']['num_servers'], max_servers_needed)
            max_comms_needed = max(
                tclist['requirements']['num_comms'], max_comms_needed)
            no_mom_on_server_flag = tclist['requirements']['no_mom_on_server']\
                or no_mom_on_server_flag
            no_comm_on_server_flag = tclist['requirements']['no_comm_on_server']\
                or no_comm_on_server_flag
            no_comm_on_mom_flag = tclist['requirements']['no_comm_on_mom']\
                or no_comm_on_mom_flag
    # Create a bash readable requirements decorator file
    write_to_file(os.path.join(ci_dirname, MACROS['CONFIG_DIR'],
                               MACROS['REQUIREMENT_DECORATOR_FILE']),
                  requirements_template.substitute(
                      num_servers=max_servers_needed,
                      num_moms=max_moms_needed,
                      num_comms=max_comms_needed,
                      no_mom_on_server=no_mom_on_server_flag,
                      no_comm_on_server=no_comm_on_server_flag,
                      no_comm_on_mom=no_comm_on_mom_flag))
    server_nodes = []
    mom_nodes = []
    comm_nodes = []
    # get required number of servers and moms
    for _ in range(max_servers_needed):
        server_nodes.append(node_image)
    if not no_mom_on_server_flag:
        # server containers double as moms; only add extra dedicated moms
        max_moms_needed = max(max_moms_needed, max_servers_needed)
        if max_moms_needed > max_servers_needed:
            for _ in range(max_moms_needed - max_servers_needed):
                mom_nodes.append(node_image)
    else:
        for _ in range(max_moms_needed):
            mom_nodes.append(node_image)
    only_moms = len(mom_nodes)
    # get required num of comms
    if no_comm_on_mom_flag and no_comm_on_server_flag:
        for _ in range(max_comms_needed):
            comm_nodes.append(node_image)
    elif no_comm_on_mom_flag and not no_comm_on_server_flag:
        if max_comms_needed > max_servers_needed:
            for _ in range(max_comms_needed-max_servers_needed):
                comm_nodes.append(node_image)
    else:
        if max_comms_needed > only_moms:
            for _ in range(max_comms_needed - only_moms):
                comm_nodes.append(node_image)
    # prefix each node with its role and join into a 'role=image;...' string
    mom_nodes = ['mom=' + x for x in mom_nodes]
    server_nodes = ['server=' + x for x in server_nodes]
    comm_nodes = ['comm=' + x for x in comm_nodes]
    node_images = ";".join(server_nodes + mom_nodes + comm_nodes)
    return node_images


def tail_build_log():
    '''
    Continuously print new last lines of the server container's build log
    until the status file reports the server service as done.
    '''
    server_name = ''
    build_log_path = get_services_list()
    for i in build_log_path:
        if i.find('server') != -1:
            build_log_path = i
            server_name = i
    build_log_path = os.path.join(
        ci_dirname, 'logs', 'build-' + build_log_path)
    prev = ''
    next = ''
    with open(build_log_path, 'rb') as f:
        while True:
            # seek backwards from EOF to the start of the last full line
            f.seek(-2, os.SEEK_END)
            while f.read(1) != b'\n':
                f.seek(-2, os.SEEK_CUR)
            next = f.readline().decode()
            if next != prev:
                print(next, end='')
                prev = next
            else:
                # no new output; check whether the server finished its build
                status = os.path.join(
                    ci_dirname, MACROS['CONFIG_DIR'], MACROS['STATUS_FILE'])
                status = read_from_file(status)
                if status.find(server_name) != -1:
                    return


def check_for_existing_image(val=default_platform):
    '''
    This function will check whether an existing image with the post-fix
    of '-ci-pbs' exists or not for the given docker image.
    '''
    if val.find('-ci-pbs') == -1:
        search_str = val.replace(":", "-")
        search_str = search_str.replace(".", '_')
        search_str += '-ci-pbs'
        cmd = 'docker images -q ' + search_str
        search_result = run_cmd(cmd, True)
        # run_cmd(..., True) yields a bytes repr; "b''" means no image found
        if search_result != "b''":
            return True, search_str
        # NOTE(review): when no committed image exists this path falls
        # through and returns None, yet callers unpack a 2-tuple — verify
    else:
        return False, val


def get_current_setup():
    '''
    Returns the node config for currently running ci containers
    '''
    compose_file = os.path.join(ci_dirname, 'docker-compose.json')
    node_config = ''
    with open(compose_file) as f:
        compose_file = json.loads(f.read())
    for service in compose_file['services']:
        image = compose_file["services"][service]['image']
        if image[-7:] == '-ci-pbs':
            # strip the '-ci-pbs' suffix and turn the LAST '-' back into ':'
            # (reverse, replace first '-', reverse again)
            image = image[:-7][::-1].replace('-', ':', 1)[::-1]
        # environment[0] is the 'NODE_TYPE=<role>' entry of the service
        node_type = compose_file["services"][service]['environment'][0]
        node_type = node_type.split('=')[1]
        node_config += node_type + '=' + image + ';'
    # drop the trailing ';'
    node_config = node_config[:-1]
    return node_config


def load_conf():
    '''
    Load and return the ci configuration json (configure/tests options).
    '''
    conf_file = os.path.join(
        ci_dirname, MACROS['CONFIG_DIR'], MACROS['CONF_JSON_FILE'])
    with open(conf_file) as f:
        conf_file = json.loads(f.read())
    return conf_file


def show_set_opts():
    '''
    Print the currently configured ci options plus the OS/role list
    derived from the docker-compose services.
    '''
    conf_opts = load_conf()
    os_file_list = get_compose_file_services_list()
    # service names look like '<role>-<image_with_dashes>-<n>';
    # rebuild the readable 'role=image:tag' form
    os_file_list = [(x.split('-', 1)[0] + '=' + x.split('-', 1)[1][:-2]
                     ).replace('-', ':').replace('_', '.')
                    for x in os_file_list]
    os_file_list.sort()
    conf_opts['OS'] = os_file_list
    print(json.dumps(conf_opts, indent=2, sort_keys=True))


def create_param_file():
    '''
    Create param file with necessary node configuration
    for multi node PTL tests.
    '''
    moms = []
    comms = []
    include_server_mom = False
    include_server_comm = False
    include_mom_comm = False
    reqs = read_from_file(os.path.join(
        ci_dirname, MACROS['CONFIG_DIR'],
        MACROS['REQUIREMENT_DECORATOR_FILE']))
    if reqs.find('no_mom_on_server=False') != -1:
        include_server_mom = True
    if reqs.find('no_comm_on_server=False') != -1:
        include_server_comm = True
    if reqs.find('no_comm_on_mom=False') != -1:
        include_mom_comm = True
    for service in get_services_list():
        service = service+'.ci.local'
        if service.find('server') != -1:
            if include_server_mom:
                moms.append(service)
            if include_server_comm:
                comms.append(service)
        if service.find('mom') != -1:
            moms.append(service)
            if include_mom_comm:
                comms.append(service)
        if service.find('comm') != -1:
            comms.append(service)
    write_str = ''
    if len(moms) != 0:
        write_str = 'moms=' + ':'.join(moms) + '\n'
    if len(comms) != 0:
        write_str += 'comms=' + ':'.join(comms)
    param_path = os.path.join(
        ci_dirname, MACROS['CONFIG_DIR'], MACROS['PARAM_FILE'])
    write_to_file(param_path, write_str)


def unpack_node_string(nodes):
    '''
    Helper function to expand abbreviated node config
    '''
    # NOTE(review): mutates `nodes` while iterating it; a '3*mom=img' entry
    # immediately following another expanded entry could be skipped — verify
    for x in nodes:
        if x.find('*') != -1:
            num = x.split('*')[0]
            try:
                num = int(num)
            except Exception:
                log_error('invalid string provided for "nodes" configuration')
                sys.exit(1)
            val = x.split('*')[1]
            nodes.remove(x)
            for _ in range(num):
                nodes.append(val)
    return ';'.join(nodes)


def build_compose_file(nodes):
    '''
    Build docker-compose file for given node config in function parameter
    '''
    compose_template = {
        "version": "3.5",
        "networks": {
            "ci.local": {
                "name": "ci.local"
            }
        },
        "services": {}
    }
    if nodes.find("*") != -1:
        nodes = unpack_node_string(nodes.split(';'))
    count = 0
    server = ''
    for n in nodes.split(';'):
        count = count + 1
        node_key, node_val = n.split('=')
        # warn only for platforms explicitly named on the command line
        if (node_val not in MACROS['SUPPORTED_PLATFORMS'].split(',')
                and ''.join(sys.argv).find(node_val) != -1):
            log_warning("Given platform '" + node_val +
                        "' is not supported by" +
                        " ci, will result in unexpected behaviour")
            log_warning("Supported platforms are " +
                        MACROS['SUPPORTED_PLATFORMS'])
        node_name = node_key + '-' + \
            (node_val.replace(':', '-')).replace('.', '_') + '-' + str(count)
        image_value = node_val
        # prefer a previously committed '-ci-pbs' image when one exists
        _, image_value = check_for_existing_image(node_val)
        service_template = json.loads(service_template_prist.substitute(
            image=image_value, node_type=node_key, hostname=node_name))
        if node_key == 'server':
            server = node_name
        compose_template['services'][node_name] = service_template
    # every service learns the server's hostname via its environment
    for service in compose_template['services']:
        compose_template['services'][service]['environment'].append(
            "SERVER="+server)
    f = open(os.path.join(ci_dirname, 'docker-compose.json'), 'w')
    json.dump(compose_template, f, indent=2, sort_keys=True)
    f.close()
    log_info("Configured nodes for ci")


def ensure_ci_running():
    '''
    Check for running ci container; if not start ci container.
    '''
    try:
        service_count = len(get_services_list())
        if service_count == 0:
            log_info("No running service found")
            try:
                log_info('Attempting to start container')
                os.chdir(ci_dirname)
                subprocess.run(["docker-compose", "-f",
                                "docker-compose.json",
                                "down", "--remove-orphans"],
                               stdout=subprocess.DEVNULL)
                # reset the build status file before starting fresh
                if os.path.exists(os.path.join(ci_dirname,
                                               MACROS['CONFIG_DIR'],
                                               MACROS['STATUS_FILE'])):
                    os.remove(os.path.join(
                        ci_dirname, MACROS['CONFIG_DIR'],
                        MACROS['STATUS_FILE']))
                write_to_file(os.path.join(
                    ci_dirname, MACROS['CONFIG_DIR'],
                    MACROS['STATUS_FILE']), '')
                subprocess.run(
                    ["docker-compose", "-f", "docker-compose.json",
                     "up", "-d"])
                log_info('Waiting for container build to complete ')
                build_log_path = os.path.join(ci_dirname, 'logs')
                log_info("Build logs can be found in " + build_log_path)
                # wait for build to complete and commit newly built container
                tail_build_log()
                commit_docker_image()
            except Exception as e:
                log_error(e)
        else:
            log_info("running container found")
            return 0
    except Exception:
        # NOTE(review): 'e' is not bound in this handler — logging it would
        # raise NameError; verify against upstream
        log_error(e)


def check_prerequisites():
    '''
    This function will check whether docker docker-compose
    commands are available.
    Also check docker version is minimum required.
    '''
    cmd = "where" if platform.system() == "Windows" else "which"
    try:
        subprocess.run([cmd, "docker"], stdout=subprocess.DEVNULL)
    except Exception:
        log_error("docker not found in PATH")
        sys.exit(1)

    def version_tuple(s: str):
        # turn 'X.Y.Z' into a comparable tuple of ints
        return tuple(int(x) for x in s.split("."))
    try:
        version = subprocess.run(
            ["docker", "--version"], stdout=subprocess.PIPE)
        version = re.findall(r'\s*([\d.]+)', version.stdout.decode('utf-8'))
        req_version = MACROS['REQ_DOCKER_VERSION']
        if version_tuple(version[0]) < version_tuple(req_version):
            print(version[0])
            print("Docker version less than minimum required " + req_version)
            sys.exit(1)
    except Exception:
        log_error("Failed to get docker version")
        sys.exit(1)
    try:
        subprocess.run([cmd, "docker-compose"], stdout=subprocess.DEVNULL)
    except Exception:
        log_error("docker-compose not found in PATH")
        sys.exit(1)


def is_restart_required():
    '''
    This function checks if the number of nodes currently running
    meet requirement for the given test case.
    If not builds new docker-compose file and
    returns bool value to restart ci.
    '''
    create_ts_tree_json()
    current_file_services_list = get_compose_file_services_list()
    current_node_image = current_file_services_list[0].split(
        '-', 1)[1][:-2].replace('-', ':')
    node_config = get_node_config(node_image=current_node_image)
    potential_list = []
    for val in node_config.split(';'):
        val = val.replace('=', '-')
        val = val.replace(':', '-')
        potential_list.append(val)
    current_file_services_list = [i[:-2] for i in current_file_services_list]
    # compare without platform names
    current_file_services_list = [
        i.split('-', 1)[0] for i in current_file_services_list]
    potential_list = [i.split('-', 1)[0] for i in potential_list]
    potential_list.sort()
    current_file_services_list.sort()
    if current_file_services_list != potential_list:
        build_compose_file(node_config)
        return True
    else:
        return False


def setup_config_dir():
    '''
    Initializes config directory and files for ci
    '''
    command_path = os.path.join(ci_dirname, MACROS['CONFIG_DIR'])
    if not os.path.exists(command_path):
        os.mkdir(command_path)
    target_path = os.path.join(command_path, MACROS['CONF_JSON_FILE'])
    if not os.path.exists(target_path):
        value = '{ "configure": "--prefix=/opt/pbs '
        value += '--enable-ptl", "tests" : "-t SmokeTest" }'
        write_to_file(target_path, value)
    target_path = os.path.join(command_path, MACROS['CONFIGURE_OPT_FILE'])
    if not os.path.exists(target_path):
        value = "--prefix=/opt/pbs --enable-ptl"
        write_to_file(target_path, value)
    target_path = os.path.join(command_path, MACROS['BENCHPRESS_OPT_FILE'])
    if not os.path.exists(target_path):
        value = "-t SmokeTest"
        write_to_file(target_path, value)
    target_path = os.path.join(ci_dirname, 'docker-compose.json')
    if not os.path.exists(target_path):
        build_compose_file('server=' + default_platform)
        run_cmd('docker-compose -f docker-compose.json down --remove-orphans')


def delete_ci():
    '''
    Takes backup of logs and deletes running containers.
    '''
    services = get_services_list()
    if len(services) != 0:
        build_compose_file(nodes=get_current_setup())
        cmd = '/src/etc/killit.sh backup'
        run_docker_cmd(cmd, run_on='server')
        log_warning('Removed logs file')
        log_info('backup files can be found in ' + build_log_path)
    else:
        log_info('No running container found, nothing to backup')
    try:
        os.chdir(ci_dirname)
        run_cmd(
            "docker-compose -f docker-compose.json down --remove-orphans")
        log_info(
            "done delete container and services")
    except Exception as e:
        # NOTE(review): string + exception concatenation raises TypeError
        # unless 'e' is str()-converted — verify
        log_error("Failed to destroy container and services: " + e)


def parse_params(params_list):
    '''
    Update given params
    '''
    # 'called' is the sentinel argparse const for -b/--build-pkgs
    if params_list[0] != 'called':
        container_running = False
        conf_opts = load_conf()
        for set_opts in params_list:
            key, value = (set_opts).split('=', 1)
            service_count = len(get_services_list())
            if service_count > 0:
                container_running = True
            if key.lower() == 'nodes':
                if container_running:
                    log_warning(
                        "Deleting existing containers first,\
 find backup in logs folder")
                    delete_ci()
                build_compose_file(value)
            elif key.lower() == 'os':
                if container_running:
                    log_warning(
                        "Deleting existing containers first, \
find backup in logs folder")
                    delete_ci()
                node_string = value.replace('"', '')
                node_string = 'server=' + node_string
                build_compose_file(node_string)
            else:
                if key in conf_opts:
                    conf_opts[key] = value
                    f = open(os.path.join(
                        ci_dirname, MACROS['CONFIG_DIR'],
                        MACROS['CONF_JSON_FILE']), 'w')
                    json.dump(conf_opts, f, indent=2, sort_keys=True)
                    f.close()
                else:
                    log_error("Unrecognised key in parameter: '" +
                              key + "' , nothing updated")
                    sys.exit(1)


def run_ci_local(local):
    '''
    Run ci locally on host without spawning containers
    '''
    os.chdir(ci_dirname)
    # using subprocess.run instead of run_cmd function
    # so we dont supress stdout and stderr
    if local == 'normal':
        exit_code = subprocess.run("./etc/do.sh")
        sys.exit(exit_code.returncode)
    if local == 'sanitize':
        exit_code = subprocess.run("./etc/do_sanitize_mode.sh")
        sys.exit(exit_code.returncode)


def run_ci(build_pkgs=False):
    '''
    Run PBS configure, install PBS and run PTL tests,
    if build_pkgs is set to True it will instead run
    package build script only
    '''
    # Display Current options
    log_info("Running ci with the following options")
    show_set_opts()
    if len(get_services_list()) > 0:
        build_compose_file(get_current_setup())
    ret = ensure_ci_running()
    if ret == 1:
        log_error(
            "container build failed, build logs can be found in " +
            build_log_path)
        sys.exit(1)
    command_path = os.path.join(ci_dirname, MACROS['CONFIG_DIR'])
    conf_opts = load_conf()
    if build_pkgs:
        build_cmd = '/src/etc/build-pbs-packages.sh'
        log_info('The package build logs can be found in logs/pkglogs')
        run_docker_cmd(build_cmd + ' | tee /logs/pkglogs', run_on='server')
        sys.exit(0)
    if conf_opts['tests'] != '':
        target_path = os.path.join(command_path,
                                   MACROS['BENCHPRESS_OPT_FILE'])
        write_to_file(target_path, conf_opts['tests'])
        # node requirements may have changed with the new test selection
        if is_restart_required():
            delete_ci()
            ensure_ci_running()
    target_path = os.path.join(command_path, MACROS['CONFIGURE_OPT_FILE'])
    if conf_opts['configure'] != read_from_file(target_path):
        # configure options changed: re-run configure inside the containers
        write_to_file(target_path, conf_opts['configure'])
        cmd = ' export ONLY_CONFIGURE=1 && /src/etc/do.sh 2>&1 \
| tee -a /logs/build-$(hostname -s) '
        run_docker_cmd(cmd)
    cmd = ' export ONLY_REBUILD=1 && /src/etc/do.sh 2>&1 \
| tee -a /logs/build-$(hostname -s) '
    run_docker_cmd(cmd)
    cmd = ' export ONLY_INSTALL=1 && /src/etc/do.sh 2>&1 \
| tee -a /logs/build-$(hostname -s) '
    run_docker_cmd(cmd)
    target_path = os.path.join(command_path, MACROS['BENCHPRESS_OPT_FILE'])
    if conf_opts['tests'] == '':
        write_to_file(target_path, conf_opts['tests'])
        log_warning("No tests assigned, skipping PTL run")
    else:
        create_param_file()
        write_to_file(target_path, conf_opts['tests'])
        cmd = 'export RUN_TESTS=1 && export ONLY_TEST=1 && /src/etc/do.sh '
        run_docker_cmd(cmd, run_on='server')


if __name__ == "__main__":
    # ci lives in <repo>/ci; derive that directory from this script's path
    ci_dirname = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
    ci_dirname = os.path.join(ci_dirname, 'ci')
    os.chdir(ci_dirname)
    read_macros()
    _help = '''
    Examples of using arguments.
    ./ci -p 'OS=centos:7'
    ./ci -p 'tests=-t SmokeTest'
    ./ci -p 'configure=CFLAGS="-g -O2" --enable-ptl'
    ./ci -p 'nodes=mom=centos:7;server=ubuntu:16.04'
    ./ci -d or ./ci --delete
    ./ci -b or ./ci --build
    ./ci -l or ./ci --local
    Note: Set tests as empty if you dont want to run PTL'
    '''
    _help += 'Supported platforms are ' + MACROS['SUPPORTED_PLATFORMS']
    ap = argparse.ArgumentParser(prog='ci',
                                 description='Runs the ci tool for pbs',
                                 formatter_class=argparse.
                                 RawTextHelpFormatter,
                                 epilog=textwrap.dedent(_help),
                                 conflict_handler='resolve')
    _help = 'set configuration values for os | nodes | configure | tests'
    ap.add_argument('-p', '--params', nargs='+', action='append',
                    help=_help, metavar='param')
    _help = 'destroy pbs container'
    ap.add_argument('-d', '--delete', action='store_true', help=_help)
    _help = 'build packages for the current platform.'
    ap.add_argument('-b', '--build-pkgs', nargs='?',
                    const='called', help=_help)
    _help = 'Simply run the tests locally, without spawning any containers.'
    _help += '\ntype can be one of normal (default) or sanitize'
    ap.add_argument('-l', '--local', nargs='?', const='normal',
                    help=_help, metavar='type')
    args = ap.parse_args()
    build_pkgs = False
    default_platform = MACROS['DEFAULT_PLATFORM']
    build_log_path = os.path.join(ci_dirname, 'logs')
    # detect a --local invocation in all its spellings; local runs skip
    # config-dir setup and the docker prerequisite checks
    not_local_run = sys.argv.count('-l') == 0 \
        and sys.argv.count('--local') == 0 \
        and sys.argv.count('-l=sanitize') == 0\
        and sys.argv.count('--local=sanitize') == 0 \
        and sys.argv.count('-l=normal') == 0 \
        and sys.argv.count('--local=normal') == 0
    if not_local_run:
        setup_config_dir()
        check_prerequisites()
    if (not args.delete) and not_local_run and (args.params is None):
        ret = ensure_ci_running()
        if ret == 1:
            log_error(
                "container build failed, build logs can be found in " +
                build_log_path)
            sys.exit(1)
    try:
        if args.params is not None:
            for p in args.params:
                parse_params(p)
        if args.build_pkgs is not None:
            build_pkgs = True
        if args.delete is True:
            confirm = input(
                'Are you sure you want to delete containers (Y/N)?: ')
            if confirm[0].lower() == 'n':
                sys.exit(0)
            elif confirm[0].lower() == 'y':
                delete_ci()
            else:
                log_error("Invalid option provided")
            sys.exit(0)
        if args.local is not None:
            run_ci_local(args.local)
    except Exception as e:
        ap.print_help()
        log_error(e)
    run_ci(build_pkgs)



================================================
FILE: ci/etc/build-pbs-packages.sh
================================================
#! /bin/bash -xe
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. . /etc/os-release pbsdir=/pbssrc rpm_dir=/root/rpmbuild rm -rf /src/packages mkdir -p /src/packages mkdir -p ${rpm_dir}/{BUILD,RPMS,SOURCES,SPECS,SRPMS} if [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x8" ]; then export LANG="C.utf8" swig_opt="--with-swig=/usr/local" if [ ! 
-f /tmp/swig/swig/configure ]; then # source install swig dnf -y install gcc-c++ byacc pcre-devel mkdir -p /tmp/swig/ cd /tmp/swig git clone https://github.com/swig/swig --branch rel-4.0.0 --single-branch cd swig ./autogen.sh ./configure make -j8 make install cd ${PBS_DIR} fi fi cp -r $pbsdir /tmp/pbs cd /tmp/pbs ./autogen.sh mkdir -p target cd target ../configure --prefix=/opt/pbs --enable-ptl ${swig_opt} make dist cp *.tar.gz ${rpm_dir}/SOURCES cp ../*-rpmlintrc ${rpm_dir}/SOURCES cp *.spec ${rpm_dir}/SPECS cflags="-g -O2 -Wall -Werror" cxxflags="-g -O2 -Wall -Werror" if [ "x${ID}" == "xdebian" -o "x${ID}" == "xubuntu" ]; then CFLAGS="${cflags} -Wno-unused-result" CXXFLAGS="${cxxflags} -Wno-unused-result" rpmbuild -ba --nodeps *.spec --with ptl else if [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x8" ]; then CFLAGS="${cflags}" CXXFLAGS="${cxxflags}" rpmbuild -ba *.spec --with ptl -D "_with_swig ${swig_opt}" else CFLAGS="${cflags}" CXXFLAGS="${cxxflags}" rpmbuild -ba *.spec --with ptl fi fi cp ${pbsdir}/README.md /src/packages/ cp ${pbsdir}/LICENSE /src/packages/ cp ${pbsdir}/COPYRIGHT /src/packages/ mv ${rpm_dir}/RPMS/*/*pbs* /src/packages/ mv ${rpm_dir}/SRPMS/*pbs* /src/packages/ cd /src/packages rm -rf /tmp/pbs if [ "x${ID}" == "xdebian" -o "x${ID}" == "xubuntu" ]; then _target_arch=$(dpkg --print-architecture) fakeroot alien --to-deb --scripts --target=${_target_arch} *-debuginfo*.rpm -g _dir=$(/bin/ls -1d *debuginfo* | grep -vE '(rpm|orig)') mv ${_dir}/opt/pbs/usr/ ${_dir}/ rm -rf ${_dir}/opt ( cd ${_dir} dpkg-buildpackage -d -b -us -uc ) rm -rf ${_dir} ${_dir}.orig *debuginfo*.buildinfo *debuginfo*.changes *debuginfo*.rpm fakeroot alien --to-deb --scripts --target=${_target_arch} *.rpm rm -f *.rpm fi ================================================ FILE: ci/etc/ci-script-wrapper.service ================================================ # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. 
# # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. [Unit] Description=Run ci docker entrypoint script at startup after all systemd services are loaded After=getty.target [Service] Type=forking RemainAfterExit=yes EnvironmentFile=/.env-file ExecStart=/src/etc/docker-entrypoint TimeoutStartSec=0 [Install] WantedBy=default.target ================================================ FILE: ci/etc/configure_node.sh ================================================ #! /bin/bash -x # Copyright (C) 1994-2021 Altair Engineering, Inc. 
# For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. . /src/etc/macros if [ -f /src/${CONFIG_DIR}/${REQUIREMENT_DECORATOR_FILE} ]; then . 
/src/${CONFIG_DIR}/${REQUIREMENT_DECORATOR_FILE} fi if [ "x${NODE_TYPE}" == "xmom" ]; then sed -i "s@PBS_SERVER=.*@PBS_SERVER=${SERVER}@" /etc/pbs.conf sed -i "s@PBS_START_SERVER=.*@PBS_START_SERVER=0@" /etc/pbs.conf ssh -t root@${SERVER} " /opt/pbs/bin/qmgr -c 'c n $(hostname -s)'" if [ "x${no_comm_on_mom}" == "xTrue" ]; then sed -i "s@PBS_START_COMM=.*@PBS_START_COMM=0@" /etc/pbs.conf else sed -i "s@PBS_START_COMM=.*@PBS_START_COMM=1@" /etc/pbs.conf fi sed -i "s@PBS_START_SCHED=.*@PBS_START_SCHED=0@" /etc/pbs.conf fi if [ "x${NODE_TYPE}" == "xserver" ]; then sed -i "s@PBS_SERVER=.*@PBS_SERVER=$(hostname)@" /etc/pbs.conf if [ "x${no_comm_on_server}" == "xTrue" ]; then sed -i "s@PBS_START_COMM=.*@PBS_START_COMM=0@" /etc/pbs.conf else sed -i "s@PBS_START_COMM=.*@PBS_START_COMM=1@" /etc/pbs.conf fi if [ "x${no_mom_on_server}" == "xTrue" ]; then sed -i "s@PBS_START_MOM=.*@PBS_START_MOM=0@" /etc/pbs.conf else sed -i "s@PBS_START_MOM=.*@PBS_START_MOM=1@" /etc/pbs.conf fi sed -i "s@PBS_START_SERVER=.*@PBS_START_SERVER=1@" /etc/pbs.conf sed -i "s@PBS_START_SCHED=.*@PBS_START_SCHED=1@" /etc/pbs.conf fi if [ "x${NODE_TYPE}" == "xcomm" ]; then sed -i "s@PBS_START_COMM=.*@PBS_START_COMM=1@" /etc/pbs.conf sed -i "s@PBS_SERVER=.*@PBS_SERVER=${SERVER}@" /etc/pbs.conf sed -i "s@PBS_START_MOM=.*@PBS_START_MOM=0@" /etc/pbs.conf sed -i "s@PBS_START_SERVER=.*@PBS_START_SERVER=0@" /etc/pbs.conf sed -i "s@PBS_START_SCHED=.*@PBS_START_SCHED=0@" /etc/pbs.conf fi ================================================ FILE: ci/etc/container-env-setup.sh ================================================ # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
# Shell environment shared by every CI container; installed as a
# /etc/profile.d snippet and appended to each user's shell rc files.
export container=docker
export TERM=xterm
# Debian/Ubuntu: keep package installs from prompting interactively.
if [ -e /etc/debian_version ]; then
	export DEBIAN_FRONTEND=noninteractive
fi
export LOGNAME=${LOGNAME:-"$(id -un)"}
export USER=${USER:-"$(id -un)"}
# PTL tests assume UTC for both the system and PBS timezone ids.
export TZ=UTC
export PBS_TZID=UTC
# Prepend /usr/local/{bin,sbin} and de-duplicate PATH entries while
# preserving first-seen order (awk keeps only the first occurrence).
export PATH="$(printf "%s" "/usr/local/bin:/usr/local/sbin:${PATH}" | awk -v RS=: -v ORS=: '!($0 in a) {a[$0]; print}')"
export DOMAIN=$(hostname -d)
# Perl module search path for the QA tooling installed under ~/AUTO.
export PERL5LIB=${HOME}/AUTO/lib/perl5/site_perl
export PERL5LIB=${PERL5LIB}:${HOME}/AUTO/lib/site_perl
export PERL5LIB=${PERL5LIB}:${HOME}/AUTO/share/perl5
export PERL5LIB=${PERL5LIB}:${HOME}/AUTO/share/perl
# Verbose PTL output and stack traces for easier CI debugging.
export PBS_TEST_DEBUG=1
export PBS_TEST_VERBOSE=1
export PBS_PRINT_STACK_TRACE=1
export MAIL="${MAIL:-"/var/mail/$(id -un)"}"


================================================
FILE: ci/etc/container-init
================================================
#!/bin/bash -x
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software.
# For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

# Install the base system packages, mirroring all output into the
# per-host build log.
/workspace/etc/install-system-packages 2>&1 | tee -a /logs/build-$(hostname -s)

# Snapshot the container environment so later shells/services can
# re-source it.
touch /.env-file
set >/.env-file

# If the container was granted CAP_SYS_ADMIN, boot systemd/init as PID 1.
# BUGFIX: the original `grep -Eq '*cap_sys_admin*'` used shell-glob syntax,
# which is not a valid extended regular expression (a leading '*' has no
# preceding atom); match the capability name as a plain literal instead.
if capsh --print | grep -q 'cap_sys_admin'; then
	if [ -x "/usr/lib/systemd/systemd" ]; then
		exec /usr/lib/systemd/systemd --system
	elif [ -x "/lib/systemd/systemd" ]; then
		exec /lib/systemd/systemd --system
	elif [ -x "/usr/sbin/init" ]; then
		exec /usr/sbin/init
	elif [ -x "/sbin/init" ]; then
		exec /sbin/init
	else
		echo "Couldn't start container in systemd mode, starting in default mode"
	fi
fi


================================================
FILE: ci/etc/do.sh
================================================
#!/bin/bash -xe
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE.
See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. if [ $(id -u) -ne 0 ]; then echo "This script must be run by root user" exit 1 fi if [ -f /src/ci ]; then IS_CI_BUILD=1 FIRST_TIME_BUILD=$1 . /src/etc/macros config_dir=/src/${CONFIG_DIR} chmod -R 755 ${config_dir} logdir=/logs chmod -R 755 ${logdir} PBS_DIR=/pbssrc else PBS_DIR=$(readlink -f $0 | awk -F'/ci/' '{print $1}') fi cd ${PBS_DIR} . /etc/os-release # Extract major version number MAJOR_VERSION="${VERSION_ID%%.*}" SPEC_FILE=$(/bin/ls -1 ${PBS_DIR}/*.spec) REQ_FILE=${PBS_DIR}/test/fw/requirements.txt if [ ! -r ${SPEC_FILE} -o ! 
-r ${REQ_FILE} ]; then echo "Couldn't find pbs spec file or ptl requirements file" exit 1 fi if [ "x${IS_CI_BUILD}" != "x1" ] || [ "x${FIRST_TIME_BUILD}" == "x1" -a "x${IS_CI_BUILD}" == "x1" ]; then if [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x7" ]; then yum clean all yum -y install yum-utils epel-release rpmdevtools yum -y install python3-pip sudo which net-tools man-db time.x86_64 \ expat libedit postgresql-server postgresql-contrib python3 \ sendmail sudo tcl tk libical libasan llvm git rpmdev-setuptree yum-builddep -y ${SPEC_FILE} yum -y install $(rpmspec --requires -q ${SPEC_FILE} | awk '{print $1}' | sort -u | grep -vE '^(/bin/)?(ba)?sh$') pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} if [ "x${BUILD_MODE}" == "xkerberos" ]; then yum -y install krb5-libs krb5-devel libcom_err libcom_err-devel fi yum -y install cmake3 rm -rf cJSON git clone https://github.com/DaveGamble/cJSON.git cd cJSON; mkdir build; cd build; cmake3 .. -DCMAKE_INSTALL_PREFIX=/usr; make; make install; cd ../../ elif [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x8" ]; then export LANG="C.utf8" sed -i -e "s|mirrorlist=|#mirrorlist=|g" /etc/yum.repos.d/CentOS-* sed -i -e "s|#baseurl=http://mirror.centos.org|baseurl=http://vault.centos.org|g" /etc/yum.repos.d/CentOS-* dnf -y clean all dnf -y install 'dnf-command(config-manager)' dnf -y config-manager --set-enabled powertools dnf -y install epel-release dnf -y install python3-pip sudo which net-tools man-db time.x86_64 \ expat libedit postgresql-server postgresql-contrib python3 \ sendmail sudo tcl tk libical libasan llvm git dnf -y builddep ${SPEC_FILE} dnf -y install $(rpmspec --requires -q ${SPEC_FILE} | awk '{print $1}' | sort -u | grep -vE '^(/bin/)?(ba)?sh$') pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} if [ "x${BUILD_MODE}" == "xkerberos" ]; then dnf -y install krb5-libs krb5-devel libcom_err libcom_err-devel fi elif [ "x${ID}" == "xrocky" -a 
"x${MAJOR_VERSION}" == "x9" ]; then export LANG="C.utf8" dnf -y clean all yum -y install yum-utils dnf -y install 'dnf-command(config-manager)' dnf config-manager --set-enabled crb dnf -y install epel-release dnf -y install python3-pip sudo which net-tools man-db time.x86_64 procps \ expat libedit postgresql-server postgresql-contrib python3 \ sendmail sudo tcl tk libical libasan llvm git chkconfig dnf -y builddep ${SPEC_FILE} dnf -y install $(rpmspec --requires -q ${SPEC_FILE} | awk '{print $1}' | sort -u | grep -vE '^(/bin/)?(ba)?sh$') pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} if [ "x${BUILD_MODE}" == "xkerberos" ]; then dnf -y install krb5-libs krb5-devel libcom_err libcom_err-devel fi elif [ "x${ID}" == "xopensuse" -o "x${ID}" == "xopensuse-leap" ]; then zypper -n ref zypper -n install rpmdevtools python3-pip sudo which net-tools man time.x86_64 git rpmdev-setuptree zypper -n install --force-resolution $(rpmspec --buildrequires -q ${SPEC_FILE} | sort -u | grep -vE '^(/bin/)?(ba)?sh$') zypper -n install --force-resolution $(rpmspec --requires -q ${SPEC_FILE} | sort -u | grep -vE '^(/bin/)?(ba)?sh$') pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} elif [ "x${ID}" == "xdebian" ]; then if [ "x${DEBIAN_FRONTEND}" == "x" ]; then export DEBIAN_FRONTEND=noninteractive fi apt-get -y update apt-get install -y build-essential dpkg-dev autoconf libtool rpm alien libssl-dev \ libxt-dev libpq-dev libexpat1-dev libedit-dev libncurses5-dev \ libical-dev libhwloc-dev pkg-config tcl-dev tk-dev python3-dev \ swig expat postgresql postgresql-contrib python3-pip sudo \ man-db git elfutils libcjson-dev pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} elif [ "x${ID}" == "xubuntu" ]; then if [ "x${DEBIAN_FRONTEND}" == "x" ]; then export DEBIAN_FRONTEND=noninteractive fi apt-get -y update apt-get install -y build-essential dpkg-dev autoconf libtool rpm 
alien libssl-dev \ libxt-dev libpq-dev libexpat1-dev libedit-dev libncurses5-dev \ libical-dev libhwloc-dev pkg-config tcl-dev tk-dev python3-dev \ swig expat postgresql python3-pip sudo man-db git elfutils libcjson-dev if [[ $(printf '%s\n' "24.04" "$VERSION_ID" | sort -V | head -n1) == "24.04" ]]; then apt-get -y install python3-nose python3-bs4 python3-defusedxml python3-pexpect else pip3 install --trusted-host pypi.org --trusted-host files.pythonhosted.org -r ${REQ_FILE} fi else echo "Unknown platform..." exit 1 fi fi if [ "x${FIRST_TIME_BUILD}" == "x1" -a "x${IS_CI_BUILD}" == "x1" ]; then echo "### First time build is complete ###" echo "READY:$(hostname -s)" >>${config_dir}/${STATUS_FILE} exit 0 fi if [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x8" ]; then export LANG="C.utf8" swig_opt="--with-swig=/usr/local" if [ ! -f /tmp/swig/swig/configure ]; then # source install swig dnf -y install gcc-c++ byacc pcre-devel mkdir -p /tmp/swig/ cd /tmp/swig git clone https://github.com/swig/swig --branch rel-4.0.0 --single-branch cd swig ./autogen.sh ./configure make -j8 make install cd ${PBS_DIR} fi fi if [ "x${ONLY_INSTALL_DEPS}" == "x1" ]; then exit 0 fi _targetdirname=target-${ID}-$(hostname -s) if [ "x${ONLY_INSTALL}" != "x1" -a "x${ONLY_REBUILD}" != "x1" -a "x${ONLY_TEST}" != "x1" ]; then rm -rf ${_targetdirname} fi mkdir -p ${_targetdirname} [[ -f Makefile ]] && make distclean || true if [ ! -f ./${SPEC_FILE} ]; then git config --global --add safe.directory ${PBS_DIR} git checkout ${SPEC_FILE} fi if [ ! 
-f ./configure ]; then ./autogen.sh fi if [ "x${ONLY_REBUILD}" != "x1" -a "x${ONLY_INSTALL}" != "x1" -a "x${ONLY_TEST}" != "x1" ]; then _cflags="-g -O2 -Wall -Werror" if [ "x${ID}" == "xubuntu" ]; then _cflags="${_cflags} -Wno-unused-result" fi cd ${_targetdirname} if [ -f /src/ci ]; then if [ -f ${config_dir}/${CONFIGURE_OPT_FILE} ]; then PYTHON_CODE=$(cat < 1: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('\'')[1]) else: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('"')[1]) END ) _cflags="$(python3 -c "$PYTHON_CODE")" PYTHON_CODE=$(cat < 1: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('\'')[1]) else: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('"')[1]) END ) _cflags="$(python3 -c "$PYTHON_CODE")" PYTHON_CODE=$(cat < 1: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('\'')[1]) else: if re.search(r"CFLAGS=(\"|\').*(\"|\')",x) != None: print(re.search(r"CFLAGS=(\"|\').*(\"|\')",x).group(0).split('"')[1]) END ) _cflags="$(python3 -c "$PYTHON_CODE")" PYTHON_CODE=$(cat <. # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. 
# # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. PBS_DIR=$(readlink -f $0 | awk -F'/ci/' '{print $1}') cd ${PBS_DIR} [ -f /sys/fs/selinux/enforce ] && echo 0 > /sys/fs/selinux/enforce yum clean all yum -y update yum -y install yum-utils epel-release rpmdevtools libasan llvm dnf config-manager --set-enabled crb rpmdev-setuptree yum -y install python3-pip sudo which net-tools man-db time.x86_64 procps yum-builddep -y ./*.spec yum -y install cmake3 git rm -rf cJSON git clone https://github.com/DaveGamble/cJSON.git cd cJSON; mkdir build; cd build; cmake3 .. -DCMAKE_INSTALL_PREFIX=/usr; make; make install; cd ../../ ./autogen.sh rm -rf target-sanitize mkdir -p target-sanitize cd target-sanitize ../configure make dist cp -fv *.tar.gz /root/rpmbuild/SOURCES/ CFLAGS="-g -O2 -Wall -Werror -fsanitize=address -fno-omit-frame-pointer" CXXFLAGS="-g -O2 -Wall -Werror -fsanitize=address -fno-omit-frame-pointer" rpmbuild -bb --with ptl *.spec yum -y install /root/rpmbuild/RPMS/x86_64/*-server-??.*.x86_64.rpm yum -y install /root/rpmbuild/RPMS/x86_64/*-debuginfo-??.*.x86_64.rpm yum -y install /root/rpmbuild/RPMS/x86_64/*-ptl-??.*.x86_64.rpm sed -i "s@PBS_START_MOM=0@PBS_START_MOM=1@" /etc/pbs.conf /etc/init.d/pbs start set +e . /etc/profile.d/ptl.sh set -e pbs_config --make-ug cd /opt/ptl/tests/ # Ignore address sanitizer link order because of # importing pbs python modules (like pbs and pbs_ifl) in ptl. # The problem is that original Python bin is not compiled with ASAN. # This will not affect pbs service as it has its own env. export ASAN_OPTIONS=verify_asan_link_order=0 pbs_benchpress --tags=smoke ================================================ FILE: ci/etc/docker-entrypoint ================================================ #!/bin/bash -ex # Copyright (C) 1994-2021 Altair Engineering, Inc. 
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

workdir=/src/etc
logdir=/logs

cd /pbssrc
# Run the first-time build (argument 1 == FIRST_TIME_BUILD), mirroring
# all output into the per-host build log.
${workdir}/do.sh 1 2>&1 | tee -a ${logdir}/build-$(hostname -s)
# BUGFIX: after a pipeline, $? holds the status of the LAST command (tee),
# so a do.sh failure was silently reported as success.  Check the first
# element of the pipeline instead.
if [ ${PIPESTATUS[0]} -ne 0 ]; then
	exit 1
else
	exit 0
fi


================================================
FILE: ci/etc/gen_ptl_json.sh
================================================
#!/bin/bash -x
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
# # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
cleanup() { cd ${etcdir} rm -rf ./tmpptl } etcdir=$(dirname $(readlink -f "$0")) cidir=/pbssrc/ci cd ${etcdir} mkdir tmpptl workdir=${etcdir}/tmpptl cd ${workdir} mkdir -p ptlsrc /bin/cp -rf ${cidir}/../test/* ptlsrc/ if [ -f ptlsrc/fw/setup.py.in ]; then sed "s;@PBS_VERSION@;1.0.0;g" ptlsrc/fw/setup.py.in >ptlsrc/fw/setup.py sed "s;@PBS_VERSION@;1.0.0;g" ptlsrc/fw/ptl/__init__.py.in >ptlsrc/fw/ptl/__init__.py fi cd ${workdir}/ptlsrc mkdir ../tp __python="$(grep -rE '^#!/usr/bin/(python|env python)[23]' fw/bin/pbs_benchpress | awk -F[/" "] '{print $NF}')" ${__python} -m pip install --trusted-host pypi.org --trusted-host files.pythonhosted.org --prefix $(pwd)/tp -r fw/requirements.txt fw/. cd tests PYTHONPATH=../tp/lib/$(/bin/ls -1 ../tp/lib)/site-packages ${__python} ../tp/bin/pbs_benchpress $1 --gen-ts-tree ret=$? if [ ${ret} -ne 0 ]; then echo "Failed to generate ptl json" cleanup exit $ret else mv ptl_ts_tree.json ${cidir} fi cleanup ================================================ FILE: ci/etc/id_rsa ================================================ -----BEGIN OPENSSH PRIVATE KEY----- b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAABlwAAAAdzc2gtcn NhAAAAAwEAAQAAAYEAt6kNw0C2ZMybkld0sucLkpaMuwn6SXB6+9scN3ZMTSFRSMxa85MT ee8sOsiyrkIjv85nAWdYsGjLBKgr43IlV2qBCxZO2YsTryl52E6pVBbVuizBj8m6sO+3hM hUBEbIrqvplrxf19y2HlNsygSlNFfMb3ptIIvTGGez+o8ZTAI3wXcFqxNxi8flo77yp6UH x31zIDOJCfN98W1GYXVwXiowfkoKkROvbH9B/HsLTjuxkHzFCGwGNzEClr3ayJSmYyJu0P nfjBPeZrL7Dxt1RwSfqI8j1kp4VhLCeEyFYS5pi8CypLgtvL37gLdqEGpBjcf4J/AyjDZJ cDgzTI+ZrTP/ldhnVMy84B8TAC53swauaec1JKDtc+FNSN28GY/0VTcyH7Pwt9gRESWFsV zrN4lwRWZivwndi3mj3zUcge3LQ6pBpjTEGiYIgNNJd5mjDZM9ieB4lC7+MTmq9Yg0Dzm4 u6uanAP5t2up6F5jck/7sLiAX4+fQ8vLZOAqsZdhAAAFgPS9UiD0vVIgAAAAB3NzaC1yc2 EAAAGBALepDcNAtmTMm5JXdLLnC5KWjLsJ+klwevvbHDd2TE0hUUjMWvOTE3nvLDrIsq5C I7/OZwFnWLBoywSoK+NyJVdqgQsWTtmLE68pedhOqVQW1boswY/JurDvt4TIVARGyK6r6Z a8X9fcth5TbMoEpTRXzG96bSCL0xhns/qPGUwCN8F3BasTcYvH5aO+8qelB8d9cyAziQnz 
ffFtRmF1cF4qMH5KCpETr2x/Qfx7C047sZB8xQhsBjcxApa92siUpmMibtD534wT3may+w 8bdUcEn6iPI9ZKeFYSwnhMhWEuaYvAsqS4Lby9+4C3ahBqQY3H+CfwMow2SXA4M0yPma0z /5XYZ1TMvOAfEwAud7MGrmnnNSSg7XPhTUjdvBmP9FU3Mh+z8LfYERElhbFc6zeJcEVmYr 8J3Yt5o981HIHty0OqQaY0xBomCIDTSXeZow2TPYngeJQu/jE5qvWINA85uLurmpwD+bdr qeheY3JP+7C4gF+Pn0PLy2TgKrGXYQAAAAMBAAEAAAGAJVEQHtATPz/jjESAzajsTQiR55 8LX8ie9HV8sjgzIKjYXzZGdJ85odja38bPp2CA6wQBIePhvVZNidCxujEDLVPSjHIn60O6 6ChBPZYeCZvqKT3WxmRyrmjGnRAnIgdP103O1HXJ845A4sCIpjNzbcM5Ip15dtdyOM85Xn uc5Di/I2wPlscIlyIyoqa1nyKFBh+TOMO/4Gm8+UT+u+akwj1IRSC+LOQXDLB+s9I8ZdTz KyxuzFtGmAg5Qm+o+IBbRbvTzpdx2UHkiFw8+VQn8fwHuzfR+Od48D1kFBCk5yGcAMTQP3 g4AV8vp/UAVU3f4stYWh7okxXE7dKY+YTb1qHbjadNp9KqJUY3d+LO2F2vT7QBD4eIDS22 1emtqfaiLXXWDG1vZHXq3wx5MlvnwFE4gSY9yxF0FsSwi3s0j8zEYjszKQBiAoPLkxmqDq 2/WcmT9GhKd5FsMQEy0W8lBePtRYw85BRfhZH7Lzh0gGZ+3ZYss4qQS2vAzqWWiuhRAAAA wHsVos2ccAcgMeTVYmo3JNgahAF0orP+NPxFLgZrK7Z0nwjICpKfaR6D3lWiFvlhUH33iv wr3gCAFTNL7zblbJXTebA5dvw8kFmUuXhe7/uRGNjn2l38j0t+aHMXDVafo7Dm1chh6pa8 AyP5/OR9sVXsFVrkQ3+iVQHJBpsXDYlI7q5j51CrNb7wgr8l8HhWyDLDTg0irmzfrvPJ43 H7URIgDIDuX7mbSnYoDDtP2azdpaZyG1IZlbFkCNyaQtjycwAAAMEA8fq3kVuTqntNXqTE 3H7CnKSwR8w7yE/VGaVs7jLRvPyHpC3umUiKWjO/ebLMKBKdS3fQ0I72MB2BdeQbmuYTBY 2FwRQOAopjketAZDrZWhjmzRgSsSRofl3N/cqya6L+0RcAfwR/2OGM9E1QzEIyPcH8khVo BK2I+xRpU5s1b5SXw5TOge9PXWgEWvRRtFRgbgOJ5WfPiLabKMm9skVx8BiNFzsVJxsEnb WdwJKwnT+2a7gIOnM+DvFQiLyEr8QTAAAAwQDCTUpPyB8cqP0cCOFFH46im7ryV3ROZLlj hj5dVKpXPyA5iHEQbPTx+VXOLSM1MysNRFPWlisE2OCES897kPgD5cypatnC1aa+sztOeD fuuEN4wZXjDo97DhIaO6YtfzhXI5Y/CEOKWQmrWlEQEf4HEGoK2kQka5KeOPKQTACLcLqi ATLFxSEDr6wyEwHA0EGh7WjH1zEpFDDY9pUCAwmyETD/OriqfCbRPhGrTTQVrcadG/Sc72 V5hjFzgl3J3TsAAAALcm9vdEBwYnMuY2k= -----END OPENSSH PRIVATE KEY----- ================================================ FILE: ci/etc/id_rsa.pub ================================================ ssh-rsa 
AAAAB3NzaC1yc2EAAAADAQABAAABgQC3qQ3DQLZkzJuSV3Sy5wuSloy7CfpJcHr72xw3dkxNIVFIzFrzkxN57yw6yLKuQiO/zmcBZ1iwaMsEqCvjciVXaoELFk7ZixOvKXnYTqlUFtW6LMGPybqw77eEyFQERsiuq+mWvF/X3LYeU2zKBKU0V8xvem0gi9MYZ7P6jxlMAjfBdwWrE3GLx+WjvvKnpQfHfXMgM4kJ833xbUZhdXBeKjB+SgqRE69sf0H8ewtOO7GQfMUIbAY3MQKWvdrIlKZjIm7Q+d+ME95msvsPG3VHBJ+ojyPWSnhWEsJ4TIVhLmmLwLKkuC28vfuAt2oQakGNx/gn8DKMNklwODNMj5mtM/+V2GdUzLzgHxMALnezBq5p5zUkoO1z4U1I3bwZj/RVNzIfs/C32BERJYWxXOs3iXBFZmK/Cd2LeaPfNRyB7ctDqkGmNMQaJgiA00l3maMNkz2J4HiULv4xOar1iDQPObi7q5qcA/m3a6noXmNyT/uwuIBfj59Dy8tk4Cqxl2E= root@pbs.ci ================================================ FILE: ci/etc/install-system-packages ================================================ #!/bin/bash -x # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. groupadd -g 1900 tstgrp00 groupadd -g 1901 tstgrp01 groupadd -g 1902 tstgrp02 groupadd -g 1903 tstgrp03 groupadd -g 1904 tstgrp04 groupadd -g 1905 tstgrp05 groupadd -g 1906 tstgrp06 groupadd -g 1907 tstgrp07 groupadd -g 901 pbs groupadd -g 1146 agt useradd -m -s /bin/bash -u 4357 -g tstgrp00 -G tstgrp00 pbsadmin useradd -m -s /bin/bash -u 9000 -g tstgrp00 -G tstgrp00 pbsbuild useradd -m -s /bin/bash -u 884 -g tstgrp00 -G tstgrp00 pbsdata useradd -m -s /bin/bash -u 4367 -g tstgrp00 -G tstgrp00 pbsmgr useradd -m -s /bin/bash -u 4373 -g tstgrp00 -G tstgrp00 pbsnonroot useradd -m -s /bin/bash -u 4356 -g tstgrp00 -G tstgrp00 pbsoper useradd -m -s /bin/bash -u 4358 -g tstgrp00 -G tstgrp00 pbsother useradd -m -s /bin/bash -u 4371 -g tstgrp00 -G tstgrp00 pbsroot useradd -m -s /bin/bash -u 4355 -g tstgrp00 -G tstgrp02,tstgrp00 pbstest useradd -m -s /bin/bash -u 4359 -g tstgrp00 -G tstgrp00 pbsuser useradd -m -s /bin/bash -u 4361 -g tstgrp00 -G tstgrp01,tstgrp02,tstgrp00 pbsuser1 useradd -m -s /bin/bash -u 4362 -g tstgrp00 -G tstgrp01,tstgrp03,tstgrp00 pbsuser2 useradd -m -s /bin/bash -u 4363 -g tstgrp00 -G tstgrp01,tstgrp04,tstgrp00 pbsuser3 useradd -m -s /bin/bash -u 4364 -g tstgrp01 -G tstgrp04,tstgrp05,tstgrp01 pbsuser4 useradd -m -s /bin/bash -u 4365 -g tstgrp02 -G tstgrp04,tstgrp06,tstgrp02 pbsuser5 useradd -m -s /bin/bash -u 4366 -g tstgrp03 -G tstgrp04,tstgrp07,tstgrp03 pbsuser6 useradd -m -s /bin/bash -u 4368 -g tstgrp01 -G tstgrp01 pbsuser7 useradd -m -s /bin/bash -u 11000 -g tstgrp00 -G tstgrp00 tstusr00 useradd -m -s 
/bin/bash -u 11001 -g tstgrp00 -G tstgrp00 tstusr01 chmod g+x,o+x /home/* . /etc/os-release if [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x8" ]; then sed -i -e "s|mirrorlist=|#mirrorlist=|g" /etc/yum.repos.d/CentOS-* sed -i -e "s|#baseurl=http://mirror.centos.org|baseurl=http://vault.centos.org|g" /etc/yum.repos.d/CentOS-* dnf -y clean all dnf -y install 'dnf-command(config-manager)' dnf -y config-manager --set-enabled powertools dnf -y install epel-release dnf -y update dnf -y install git gcc make m4 autoconf automake libtool rpm-build rpmdevtools \ hwloc-devel libX11-devel libXt-devel libXext-devel libXft-devel \ libedit-devel libical-devel cmake glibc-common yum-utils \ ncurses-devel postgresql-devel python3-devel tcl-devel tk-devel swig \ expat-devel openssl-devel libXext libXft expat libedit glibc-static \ postgresql-server python3 tcl tk libical perl tar sendmail sudo perl-Env \ perl-Switch gcc-c++ doxygen elfutils bison flex glibc-langpack-en \ which net-tools man-db time csh lsof tzdata file \ expect perl-App-cpanminus cpan initscripts \ systemd systemd-sysv libcap rsyslog \ openssh-clients openssh-server valgrind-devel valgrind libasan \ llvm bc gzip gdb rsync wget curl ccache bind-utils vim iputils pam-devel dnf -y clean all rpmdev-setuptree __systemd_paths='/etc/systemd/system /usr/lib/systemd/system' elif [ "x${ID}" == "xcentos" -a "x${VERSION_ID}" == "x7" ]; then yum -y clean all rpm --import https://package.perforce.com/perforce.pubkey && { echo [perforce] echo name=Perforce echo baseurl=http://package.perforce.com/yum/rhel/7/x86_64 echo enabled=1 echo gpgcheck=1 } >/etc/yum.repos.d/perforce.repo yum -y install epel-release yum -y update yum -y install git gcc make m4 autoconf automake libtool rpm-build rpmdevtools \ hwloc-devel libX11-devel libXt-devel libXext-devel libXft-devel \ libedit-devel libical-devel cmake glibc-common yum-utils \ ncurses-devel postgresql-devel python3-devel tcl-devel tk-devel swig \ expat-devel openssl-devel libXext 
libXft expat libedit glibc-static \ postgresql-server python3 tcl tk libical perl tar sendmail sudo perl-Env \ perl-Switch gcc-c++ doxygen elfutils bison flex postgresql-contrib \ which net-tools man-db time csh lsof tzdata file glibc-langpack-en \ expect perl-App-cpanminus cpan \ systemd systemd-sysv libcap rsyslog \ openssh-clients openssh-server valgrind-devel valgrind libasan pam-devel \ llvm bc gzip gdb rsync wget curl ccache bind-utils vim iputils python2-pip helix-cli yum -y clean all rpmdev-setuptree __systemd_paths='/etc/systemd/system /usr/lib/systemd/system' elif [ "x${ID}" == "xopensuse" -o "x${ID}" == "xopensuse-leap" ]; then __on="$(grep -oP '(?<=^NAME=").*(?=")' /etc/os-release)" __ov="$(grep -oP '(?<=^VERSION=").*(?=")' /etc/os-release)" zypper -n addrepo -ceKfG "https://download.opensuse.org/repositories/devel:tools/${__on// /_}_${__ov// /_}/devel:tools.repo" zypper -n addrepo -ceKfG "https://download.opensuse.org/repositories/devel:languages:perl/${__on// /_}_${__ov// /_}/devel:languages:perl.repo" zypper -n addrepo -ceKfG "http://package.perforce.com/yum/rhel/7/x86_64" p4 zypper -n clean -mMa zypper -n refresh -fbd zypper --no-gpg-checks -n update --force-resolution zypper --no-gpg-checks -n install --force-resolution git m4 \ gcc make autoconf automake libtool rpm-build rpmdevtools helix-cli hwloc-devel \ libX11-devel libXt-devel libedit-devel libical-devel cmake ncurses-devel \ postgresql-devel python3-devel tcl-devel tk-devel swig libexpat-devel \ libopenssl-devel libXext-devel libXft-devel expat libedit fontconfig net-tools-deprecated net-tools \ timezone python3-xml glibc-devel-static postgresql-server python3 python3-pip tcl tk \ perl tar sendmail sudo gcc-c++ doxygen elfutils bison flex \ which net-tools net-tools-deprecated man time tcsh lsof file vim \ expect perl-App-cpanminus perl-Parse-PMFile hostname bind-utils \ systemd systemd-sysvinit libcap-progs iputils rsyslog openssh pam-devel \ valgrind-devel valgrind llvm gdb rsync wget 
ccache bc gzip python-pip zypper -n clean -mMa zypper -n rr devel_tools rpmdev-setuptree __systemd_paths='/etc/systemd/system /usr/lib/systemd/system' elif [ "x${ID}" == "xubuntu" ]; then if [ "x${DEBIAN_FRONTEND}" == "x" ]; then export DEBIAN_FRONTEND=noninteractive fi apt -y update apt -y upgrade apt -y install git build-essential gcc g++ make dpkg-dev m4 \ autoconf automake libtool rpm alien elfutils dh-make \ libhwloc-dev libx11-dev libxt-dev libedit-dev libical-dev cmake \ libncurses-dev libpq-dev python3-dev tcl-dev tk-dev swig libexpat1-dev \ libssl-dev libxext-dev libxft-dev pkg-config expat postgresql perl tar \ sendmail sendmail-bin sudo doxygen bison flex fakeroot libnuma1 \ net-tools man time csh lsof curl gzip iputils-ping \ expect cpanminus locales-all dnsutils tzdata vim bc file \ systemd systemd-sysv sysvinit-utils libcap2-bin rsyslog libpam-dev \ openssh-server openssh-client valgrind llvm gdb rsync wget ccache \ python3 python3-pip cpanminus if [ "x${ID}" == "xubuntu" -a "x${VERSION_ID}" == "x16.04" ]; then wget -qO - https://package.perforce.com/perforce.pubkey | apt-key add - && echo 'deb http://package.perforce.com/apt/ubuntu/ xenial release' >/etc/apt/sources.list.d/perforce.list else wget -qO - https://package.perforce.com/perforce.pubkey | apt-key add - && echo 'deb http://package.perforce.com/apt/ubuntu/ bionic release' >/etc/apt/sources.list.d/perforce.list fi apt -y update apt -y install helix-cli __systemd_paths='/etc/systemd/system /lib/systemd/system' apt -y autoremove apt -y clean rm -rf /var/lib/apt/list/* mkdir -p /root/rpmbuild/SOURCES fi # Install pip, requests and sh python modules set -ex && python -m pip install --trusted-host pypi.org --trusted-host files.pythonhosted.org requests sh && rm -rf ~/.cache /tmp/* # QALib deps modules cpanm -n --no-wget --no-lwp --curl \ IO::Pty IPC::Run IPC::Cmd Class::Accessor Module::Build Pod::Usage \ Getopt::Long DateTime Date::Parse Proc::ProcessTable Test::More \ Unix::Process Time::HiRes 
File::FcntlLock File::Remote find ${__systemd_paths} -path '*.wants/*' \ -not -name '*journald*' \ -not -name '*systemd-tmpfiles*' \ -not -name '*systemd-user-sessions*' \ -not -name '*getty*' \ -not -name '*dbus*' \ -exec rm -fv {} \; cp /workspace/etc/ci-script-wrapper.service /etc/systemd/system systemctl set-default multi-user.target systemctl enable sshd || systemctl enable ssh systemctl enable sendmail if [ "x${ID}" != "xubuntu" -a "x${VERSION_ID}" != "x16.04" ]; then systemctl disable sm-client systemctl mask sm-client fi systemctl enable rsyslog systemctl disable getty@.service systemctl unmask getty.target systemctl unmask console-getty systemctl enable getty.target systemctl enable console-getty systemctl enable ci-script-wrapper cp /workspace/etc/container-env-setup.sh /etc/profile.d/0container-env-setup.sh cp /workspace/etc/sudoers-overrides /etc/sudoers.d/container-overrides echo '' >/etc/security/limits.conf rm -f /etc/security/limits.d/*.conf rm -rf ~/.ssh mkdir --mode=700 ~/.ssh cp /workspace/etc/id_rsa* ~/.ssh/ chmod 0600 ~/.ssh/id_rsa chmod 0644 ~/.ssh/id_rsa.pub cp ~/.ssh/id_rsa.pub ~/.ssh/authorized_keys chmod 0600 ~/.ssh/authorized_keys echo 'root:pbs' | chpasswd cat /etc/profile.d/0container-env-setup.sh >>/root/.profile cat /etc/profile.d/0container-env-setup.sh >>/root/.bash_profile cat /etc/profile.d/0container-env-setup.sh >>/root/.bashrc for user in $(awk -F: '/^(pbs|tst)/ {print $1}' /etc/passwd); do rm -rf /home/${user}/.ssh cp -rfp ~/.ssh /home/${user}/ chown -R ${user}: /home/${user}/.ssh echo "${user}:pbs" | chpasswd cat /etc/profile.d/0container-env-setup.sh >>/home/${user}/.profile cat /etc/profile.d/0container-env-setup.sh >>/home/${user}/.bash_profile cat /etc/profile.d/0container-env-setup.sh >>/home/${user}/.bashrc chown ${user}: /home/${user}/.bashrc /home/${user}/.profile /home/${user}/.bash_profile done echo 'Host *' >>/etc/ssh/ssh_config echo ' StrictHostKeyChecking no' >>/etc/ssh/ssh_config echo ' ConnectionAttempts 3' 
>>/etc/ssh/ssh_config echo ' IdentityFile ~/.ssh/id_rsa' >>/etc/ssh/ssh_config echo ' PreferredAuthentications publickey,password' >>/etc/ssh/ssh_config echo 'PermitRootLogin yes' >>/etc/ssh/sshd_config echo 'UseDNS no' >>/etc/ssh/sshd_config sed -i 's/AcceptEnv/# AcceptEnv/g' /etc/ssh/sshd_config ssh-keygen -A rm -f /var/run/*.pid /run/nologin rm -rf ~/.cache ~/.cpanm /var/{log,cache} /tmp /var/tmp /run/*.pid /var/run/*.pid mkdir -p --mode=0755 /var/{log,cache} mkdir -p --mode=1777 /tmp /var/tmp ================================================ FILE: ci/etc/killit.sh ================================================ #!/bin/bash -x # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. killit() { if [ -z "$1" ]; then return 0 fi pid=$(ps -ef 2>/dev/null | grep $1 | grep -v grep | awk '{print $2}') if [ ! -z "${pid}" ]; then echo "kill -TERM ${pid}" kill -TERM ${pid} 2>/dev/null else return 0 fi sleep 10 pid=$(ps -ef 2>/dev/null | grep $1 | grep -v grep | awk '{print $2}') if [ ! -z "${pid}" ]; then echo "kill -KILL ${pid}" kill -KILL ${pid} 2>/dev/null fi } kill_pbs_process() { ps -eaf 2>/dev/null | grep pbs_ | grep -v grep | wc -l if [ $ret -gt 0 ]; then killit pbs_server killit pbs_mom killit pbs_comm killit pbs_sched killit pbs_ds_monitor killit /opt/pbs/pgsql/bin/postgres killit pbs_benchpress ps_count=$(ps -eaf 2>/dev/null | grep pbs_ | grep -v grep | wc -l) if [ ${ps_count} -eq 0 ]; then return 0 else return 1 fi fi } . /etc/os-release if [ "x$1" == "xbackup" ]; then time_stamp=$(date -u "+%Y-%m-%d-%H%M%S") folder=session-${time_stamp} mkdir -p /logs/${folder} cp /logs/build-* /logs/${folder} cp /logs/logfile* /logs/${folder} cp /logs/result* /logs/${folder} cp /src/.config_dir/.conf.json /logs/${folder}/conf.json cp /src/docker-compose.json /logs/${folder}/ rm -rf /logs/build-* rm -rf /logs/logfile* rm -rf /logs/result* rm -rf /pbssrc/target-* exit 0 fi clean=${1} echo "Trying to stop all process via init.d" /etc/init.d/pbs stop ret=$? 
if [ ${ret} -ne 0 ]; then echo "failed graceful stop" echo "force kill all processes" kill_pbs_process else echo "checking for running ptl" benchpress_count=$(ps -ef 2>/dev/null | grep $1 | grep -v grep | wc -l) if [ ${benchpress_count} -gt 0 ]; then killit pbs_benchpress else echo "No running ptl tests found" fi fi if [ "XX${clean}" == "XXclean" ]; then cd /pbssrc/target-${ID} && make uninstall rm -rf /etc/init.d/pbs rm -rf /etc/pbs.conf rm -rf /var/spool/pbs rm -rf /opt/ptl rm -rf /opt/pbs fi ================================================ FILE: ci/etc/macros ================================================ CONFIG_DIR=.config_dir STATUS_FILE=status PARAM_FILE=params REQUIREMENT_DECORATOR_FILE=requirements_decorator CONFIGURE_OPT_FILE=configure_opt BENCHPRESS_OPT_FILE=benchpress_opt CONF_JSON_FILE=conf.json REQ_DOCKER_VERSION=17.12.0 DEFAULT_PLATFORM=centos:8 SUPPORTED_PLATFORMS=centos:7,centos:8,ubuntu:16.04,ubuntu:18.04 ================================================ FILE: ci/etc/sudoers-overrides ================================================ Defaults syslog = local7 Defaults always_set_home Defaults !requiretty Defaults !env_reset Defaults !secure_path Defaults env_keep = "*" ALL ALL=(ALL) NOPASSWD: ALL ================================================ FILE: configure.ac ================================================ # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. # AC_PREREQ([2.63]) # Use PBS_VERSION to override the version statically defined here. For example: # ./configure PBS_VERSION=20.0.0 --prefix=/opt/pbs AC_INIT([OpenPBS], [23.06.06], [pbssupport@altair.com], [openpbs], [http://www.openpbs.org/]) AC_CONFIG_HEADERS([src/include/pbs_config.h]) AC_CONFIG_SRCDIR([src/cmds/qmgr.c]) AC_CONFIG_AUX_DIR([buildutils]) AC_CONFIG_MACRO_DIR([m4]) AC_CANONICAL_TARGET([]) os_id=`grep ^ID= /etc/os-release | sed -n 's/.*"\(.*\)"/\1/p'` AS_CASE([$os_id], [opensuse-tumbleweed], m4_define([am_init_string], [-Wall foreign subdir-objects]), [*], m4_define([am_init_string], [-Wall foreign])) AM_INIT_AUTOMAKE(am_init_string) AC_USE_SYSTEM_EXTENSIONS # Checks for programs. 
AC_PROG_AWK
AC_PROG_YACC
AC_PROG_SED
AC_PROG_CC
AC_PROG_LEX
AC_PROG_INSTALL
AC_PROG_LN_S
AC_PROG_CXX
AC_SUBST([AM_CXXFLAGS], [--std=c++11])

# Automake macros
#AM_PROG_AR macro is defined with automake version >= 1.12
m4_ifdef([AM_PROG_AR], [AM_PROG_AR])
AM_PROG_CC_C_O

# Initialize libtool
AM_PROG_LIBTOOL
LT_INIT([shared static])

# Checks for libraries.
AC_CHECK_LIB([c], [xdr_int], [],
	AC_CHECK_LIB(nsl, xdr_int)
)
AC_CHECK_LIB([c], [ruserok], [],
	AC_CHECK_LIB(socket, ruserok)
)
AC_CHECK_LIB([c], [crypt], [],
	AC_CHECK_LIB(crypt, crypt)
)
dnl Typo fix: description previously read "Defined whe posix_openpt is
dnl available"; now matches the HAVE_MALLOC_INFO wording below.
AC_CHECK_LIB([c], [posix_openpt],
	AC_DEFINE([HAVE_POSIX_OPENPT], [], [Defined when posix_openpt is available])
)
AC_CHECK_LIB(dl, dlopen)
AC_CHECK_LIB([kvm], [kvm_open])
AC_CHECK_LIB([socket], [socket],
	[socket_lib="-lsocket -lnsl"] AC_SUBST(socket_lib),
	[socket_lib=""] AC_SUBST(socket_lib),
	[-lnsl]
)
AC_CHECK_LIB([c], [malloc_info],
	AC_DEFINE([HAVE_MALLOC_INFO], [], [Defined when malloc_info is available])
)

# Check for X Window System
AC_PATH_XTRA

# Checks for optional header files.
AC_CHECK_HEADERS([ \
	com_err.h \
	gssapi.h \
	krb5.h \
	libpq-fe.h \
	mach/mach.h \
	nlist.h \
	sys/eventfd.h \
	sys/systeminfo.h \
])

# Checks for required header files.
AC_CHECK_HEADERS([ \ stdio.h \ alloca.h \ arpa/inet.h \ assert.h \ ctype.h \ dirent.h \ dlfcn.h \ execinfo.h \ fcntl.h \ float.h \ fstab.h \ ftw.h \ grp.h \ libgen.h \ limits.h \ math.h \ memory.h \ netdb.h \ netinet/in.h \ netinet/in_systm.h \ netinet/ip.h \ netinet/tcp.h \ openssl/aes.h \ openssl/bio.h \ openssl/err.h \ openssl/evp.h \ openssl/ssl.h \ paths.h \ poll.h \ pthread.h \ pwd.h \ regex.h \ signal.h \ stdbool.h \ stddef.h \ stdint.h \ stdio.h \ stdlib.h \ string.h \ strings.h \ syslog.h \ sys/fcntl.h \ sys/file.h \ sys/ioctl.h \ sys/mman.h \ sys/mount.h \ sys/param.h \ sys/poll.h \ sys/quota.h \ sys/resource.h \ sys/select.h \ sys/signal.h \ sys/socket.h \ sys/stat.h \ sys/statvfs.h \ sys/time.h \ sys/timeb.h \ sys/times.h \ sys/types.h \ sys/uio.h \ sys/un.h \ sys/user.h \ sys/utsname.h \ sys/wait.h \ termios.h \ time.h \ unistd.h \ utime.h \ X11/Intrinsic.h \ X11/X.h \ X11/Xlib.h \ zlib.h \ ],, AC_MSG_ERROR([Required header file is missing.]) \ ) # Checks for typedefs, structures, and compiler characteristics. #AC_CHECK_HEADER_STDBOOL macro is defined with autoconf version >= 2.67 m4_ifdef([AC_CHECK_HEADER_STDBOOL], [AC_CHECK_HEADER_STDBOOL]) AC_TYPE_UID_T AC_TYPE_MODE_T AC_TYPE_OFF_T AC_TYPE_PID_T AC_C_RESTRICT AC_TYPE_SIZE_T AC_TYPE_SSIZE_T AC_CHECK_MEMBERS([struct stat.st_blksize]) AC_TYPE_UINT16_T AC_TYPE_UINT32_T AC_TYPE_UINT64_T AC_TYPE_UINT8_T AC_CHECK_TYPES([ptrdiff_t]) # Checks for library functions. 
AC_FUNC_ALLOCA AC_FUNC_CHOWN AC_FUNC_ERROR_AT_LINE AC_FUNC_FORK AC_FUNC_GETGROUPS AC_FUNC_GETMNTENT AC_FUNC_LSTAT_FOLLOWS_SLASHED_SYMLINK AC_FUNC_MKTIME AC_FUNC_MMAP AC_FUNC_STRERROR_R AC_FUNC_STRTOD AC_CHECK_FUNCS([ \ alarm \ atexit \ bzero \ dup2 \ endpwent \ floor \ ftruncate \ getcwd \ gethostbyaddr \ gethostbyname \ gethostname \ getmntent \ getpagesize \ gettimeofday \ hasmntopt \ inet_ntoa \ localtime_r \ memchr \ memmove \ memset \ mkdir \ munmap \ pathconf \ poll \ pstat_getdynamic \ putenv \ realpath \ regcomp \ rmdir \ select \ setresuid \ setresgid \ getpwuid \ initgroups \ seteuid \ setegid \ strerror_r \ socket \ strcasecmp \ strchr \ strcspn \ strdup \ strerror \ strncasecmp \ strpbrk \ strrchr \ strspn \ strstr \ strtol \ strtoul \ strtoull \ sysinfo \ uname \ utime \ ]) PKG_PROG_PKG_CONFIG m4_ifdef([PKG_INSTALLDIR], [PKG_INSTALLDIR], [ pkgconfigdir=/usr/lib64/pkgconfig AC_SUBST([pkgconfigdir]) ]) # PBS macros (order matters for some of these) PBS_AC_PBS_VERSION PBS_AC_DECL_H_ERRNO PBS_AC_DECL_SOCKLEN_T PBS_AC_DECL_EPOLL PBS_AC_DECL_EPOLL_PWAIT PBS_AC_DECL_PPOLL PBS_AC_WITH_SERVER_HOME PBS_AC_WITH_SERVER_NAME_FILE PBS_AC_WITH_DATABASE_DIR PBS_AC_WITH_DATABASE_USER PBS_AC_WITH_DATABASE_PORT PBS_AC_WITH_PBS_CONF_FILE PBS_AC_WITH_TMP_DIR PBS_AC_WITH_UNSUPPORTED_DIR PBS_AC_WITH_CORE_LIMIT PBS_AC_WITH_PYTHON PBS_AC_WITH_EXPAT PBS_AC_WITH_EDITLINE PBS_AC_WITH_HWLOC PBS_AC_WITH_LIBICAL PBS_AC_WITH_PMIX PBS_AC_WITH_SENDMAIL PBS_AC_WITH_SWIG PBS_AC_WITH_TCL PBS_AC_WITH_TCLATRSEP PBS_AC_WITH_XAUTH PBS_AC_WITH_KRBAUTH PBS_AC_WITH_MIN_STACK_LIMIT PBS_AC_DISABLE_SHELL_PIPE PBS_AC_DISABLE_SYSLOG PBS_AC_SECURITY PBS_AC_ENABLE_ALPS PBS_AC_WITH_LIBZ PBS_AC_ENABLE_PTL PBS_AC_SYSTEMD_UNITDIR PBS_AC_PATCH_LIBTOOL PBS_AC_WITH_CJSON AC_CONFIG_FILES([ openpbs.spec Makefile buildutils/Makefile doc/Makefile test/Makefile test/fw/Makefile test/tests/Makefile test/fw/setup.py test/fw/ptl/__init__.py src/Makefile src/cmds/Makefile src/cmds/mpiexec src/cmds/pbs_lamboot 
src/cmds/pbs_mpihp src/cmds/pbs_mpilam src/cmds/pbs_mpirun src/cmds/pbs_remsh src/cmds/pbsrun_unwrap src/cmds/pbsrun_wrap src/cmds/pbsrun src/cmds/scripts/Makefile src/cmds/scripts/modulefile src/cmds/scripts/pbs_habitat src/cmds/scripts/pbs_init.d src/cmds/scripts/pbs_reload src/cmds/scripts/pbs_poerun src/cmds/scripts/pbs_postinstall src/cmds/scripts/pbs.service src/cmds/scripts/pbsrun.poe src/hooks/Makefile src/iff/Makefile src/include/Makefile src/include/pbs_version.h src/lib/Libattr/Makefile src/lib/Libdb/Makefile src/lib/Libdb/pgsql/Makefile src/lib/Libifl/Makefile src/lib/Liblog/Makefile src/lib/Libnet/Makefile src/lib/Libpbs/Makefile src/lib/Libpbs/pbs.pc src/lib/Libpython/Makefile src/lib/Libsec/Makefile src/lib/Libsite/Makefile src/lib/Libtpp/Makefile src/lib/Libutil/Makefile src/lib/Libauth/Makefile src/lib/Libauth/gss/Makefile src/lib/Libauth/munge/Makefile src/lib/Liblicensing/Makefile src/lib/Libjson/Makefile src/lib/Libjson/cJSON/Makefile src/lib/Makefile src/modules/Makefile src/modules/python/Makefile src/mom_rcp/Makefile src/resmom/Makefile src/scheduler/Makefile src/server/Makefile src/tools/Makefile src/tools/wrap_tcl.sh src/unsupported/Makefile ]) AC_OUTPUT ================================================ FILE: doc/Makefile.am ================================================ # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
# notrans_dist_man1_MANS = \ man1/pbsdsh.1B \ man1/pbs_login.1B \ man1/pbs_python.1B \ man1/pbs_ralter.1B \ man1/pbs_rdel.1B \ man1/pbs_release_nodes.1B \ man1/pbs_rstat.1B \ man1/pbs_rsub.1B \ man1/qalter.1B \ man1/qdel.1B \ man1/qhold.1B \ man1/qmove.1B \ man1/qmsg.1B \ man1/qorder.1B \ man1/qrerun.1B \ man1/qrls.1B \ man1/qselect.1B \ man1/qsig.1B \ man1/qstat.1B \ man1/qsub.1B notrans_dist_man3_MANS = \ man3/pbs_alterjob.3B \ man3/pbs_asyrunjob.3B \ man3/pbs_confirmresv.3B \ man3/pbs_connect.3B \ man3/pbs_default.3B \ man3/pbs_deljob.3B \ man3/pbs_delresv.3B \ man3/pbs_disconnect.3B \ man3/pbs_geterrmsg.3B \ man3/pbs_holdjob.3B \ man3/pbs_locjob.3B \ man3/pbs_manager.3B \ man3/pbs_modify_resv.3B \ man3/pbs_movejob.3B \ man3/pbs_msgjob.3B \ man3/pbs_orderjob.3B \ man3/pbs_preempt_jobs.3B \ man3/pbs_rerunjob.3B \ man3/pbs_rescreserve.3B \ man3/pbs_relnodesjob.3B \ man3/pbs_rlsjob.3B \ man3/pbs_runjob.3B \ man3/pbs_selectjob.3B \ man3/pbs_selstat.3B \ man3/pbs_sigjob.3B \ man3/pbs_stagein.3B \ man3/pbs_statfree.3B \ man3/pbs_stathook.3B \ man3/pbs_stathost.3B \ man3/pbs_statjob.3B \ man3/pbs_statnode.3B \ man3/pbs_statque.3B \ man3/pbs_statresv.3B \ man3/pbs_statrsc.3B \ man3/pbs_statsched.3B \ man3/pbs_statserver.3B \ man3/pbs_statvnode.3B \ man3/pbs_submit.3B \ man3/pbs_submit_resv.3B \ man3/pbs_tclapi.3B \ man3/pbs_terminate.3B \ man3/rm.3B \ man3/tm.3 noinst_man3_MANS = \ man3/pbs_rescquery.3B \ man3/pbs_submitresv.3B notrans_dist_man7_MANS = \ man1/pbs_hook_attributes.7B \ man1/pbs_job_attributes.7B \ man1/pbs_module.7B \ man1/pbs_node_attributes.7B \ man1/pbs_professional.7B \ man1/pbs_queue_attributes.7B \ man1/pbs_resources.7B \ man1/pbs_resv_attributes.7B \ man1/pbs_sched_attributes.7B \ man1/pbs_server_attributes.7B notrans_dist_man8_MANS = \ man8/mpiexec.8B \ man8/pbs.8B \ man8/pbs_account.8B \ man8/pbs_attach.8B \ man8/pbs_comm.8B \ man8/pbs.conf.8B \ man8/pbs_dataservice.8B \ man8/pbs_ds_password.8B \ man8/pbsfs.8B \ man8/pbs_hostn.8B \ 
man8/pbs_idled.8B \ man8/pbs_iff.8B \ man8/pbs_interactive.8B \ man8/pbs_lamboot.8B \ man8/pbs_mkdirs.8B \ man8/pbs_mom.8B \ man8/pbs_mpihp.8B \ man8/pbs_mpilam.8B \ man8/pbs_mpirun.8B \ man8/pbsnodes.8B \ man8/pbs_probe.8B \ man8/pbsrun.8B \ man8/pbsrun_unwrap.8B \ man8/pbsrun_wrap.8B \ man8/pbs_sched.8B \ man8/pbs_server.8B \ man8/pbs_snapshot.8B \ man8/pbs_tclsh.8B \ man8/pbs_tmrsh.8B \ man8/pbs_topologyinfo.8B \ man8/pbs_wish.8B \ man8/printjob.8B \ man8/qdisable.8B \ man8/qenable.8B \ man8/qmgr.8B \ man8/qrun.8B \ man8/qstart.8B \ man8/qstop.8B \ man8/qterm.8B \ man8/tracejob.8B \ man8/win_postinstall.py.8B ================================================ FILE: doc/man1/pbs_hook_attributes.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. 
.\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_hook_attributes 7B "6 May 2020" Local "PBS Professional" .SH NAME .B pbs_hook_attributes \- attributes of PBS hooks .SH DESCRIPTION .LP Hook attributes can be set, unset, and viewed using the .B qmgr command. See the .B qmgr(1B) man page. An unset hook attribute takes the default value for that attribute. Under UNIX/Linux, root privilege is required in order to operate on hooks. Under Windows, this must be done from the installation account. For domained environments, the installation account must be a lo cal account that is a member of the local Administrators group on the local computer. For standalone environments, the ins tallation account must be a local account that is a member of the local Administrators group on the local computer. .IP "alarm=" Specifies the number of seconds to allow a hook to run before the hook times out. .br Set by administrator. .br Valid values: >0 .br Format: Integer .br Default value: 30 .IP "debug" Specifies whether or not the hook produces debugging files under PBS_HOME/server_priv/hooks/tmp or PBS_HOME/mom_priv/hooks/tmp. Files are named hook___.in, .data, and .out. When this is set to .I true, the hook leaves debugging files. .br Set by administrator. .br Format: Boolean .br Default value: False .IP "enabled" Determines whether or not a hook is run when its triggering event occurs. If a hook's .I enabled attribute is .I True, the hook is run. .br Set by administrator. .br Format: Boolean .br Default: True .IP "event" List of events that trigger the hook. 
Can be operated on with the "=", "+=", and "-=" operators. The .I provision event cannot be combined with any other events. .br Valid events: .RS 11 .nf "exechost_periodic" "exechost_startup" "execjob_attach" "execjob_begin" "execjob_end" "execjob_epilogue" "execjob_launch" "execjob_postsuspend" "execjob_preresume" "execjob_preterm" "execjob_prologue" "modifyjob" "movejob" "periodic" "provision" "queuejob" "resvsub" "runjob" "" (meaning no event) .fi .RE .IP .br Set by administrator. .br Format: string array .br Default value: "" (meaning none, i.e. the hook is not triggered) .IP "fail_action" Specifies the action to be taken when hook fails due to alarm call or unhandled exception, or to an internal error such as not enough disk space or memory. Can also specify a subsequent action to be taken when hook runs successfully. Value can be either "none" or one or more of "offline_vnodes", "clear_vnodes_upon_recovery", and "scheduler_restart_cycle". If this attribute is set to multiple values, scheduler restart happens last. .br .I offline_vnodes .RS 11 After unsuccessful hook execution, offlines the vnodes managed by the MoM executing the hook. Only available for execjob_prologue, exechost_startup and execjob_begin hooks. .RE .IP .I clear_vnodes_upon_recovery .RS 11 After successful hook execution, clears vnodes previously offlined via offline_vnodes fail action. Only available for exechost_startup hooks. .RE .IP .I scheduler_restart_cycle .RS 11 After unsuccessful hook execution, restarts scheduling cycle. Only available for execjob_begin and execjob_prologue hooks. .RE .IP .br Set by administrator. .br Format: string_array .br Default value: "none" .IP "freq" Number of seconds between periodic or exechost_periodic triggers. .br Set by administrator. .br Format: integer .br Default: 120 seconds .IP "order" Indicates relative order of hook execution, for hooks of the same type sharing a trigger. Hooks with lower .I order values execute before those with higher values. 
Does not apply to periodic or exechost_periodic hooks. .br Set by administrator. .br Valid values: .RS 8 Built-in hooks: .I [-1000, 2000] .br Site hooks: .I [1, 1000] .RE .IP Format: Integer .br Default value: 1 .IP "Type" The type of the hook. Cannot be set for a built-in hook. .br Valid values: "pbs", "site" .br .I pbs .RS 11 Hook is built in. .RE .IP .I site .RS 11 Hook is custom (site-defined). .RE .IP .br Set by administrator. .br Format: String .br Default value: "site" .IP "user" Specifies who executes the hook. .br Valid values: "pbsadmin", "pbsuser" .br .I "pbsadmin" .RS 11 The hook executes as root. .RE .IP .I "pbsuser" .RS 11 The hook executes as the triggering job's owner. .RE .IP .br Set by administrator. .br Format: String .br Default value: "pbsadmin" .SH SEE ALSO qmgr(1B), pbs_module(7B), pbs_stathook(3B) ================================================ FILE: doc/man1/pbs_job_attributes.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . 
.\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_job_attributes 7B "4 March 2021" Local "PBS Professional" .SH NAME .B pbs_job_attributes \- attributes of PBS jobs .SH DESCRIPTION Each PBS job has attributes that characterize that job. .IP "Account_Name" 8 String used for accounting purposes. Can be used for fairshare. .br Can be read and set by user, Operator, Manager. .br Format: .I String; can contain any character. .br Python type: .I str .br Default: No default .IP accounting_id 8 Accounting ID for tracking accounting data not produced by PBS. Readable by all. .br Format: .I String .br Python type: .I str .IP accrue_type 8 Indicates what kind of time the job is accruing. .br Readable by Manager only. .br Format: .I Integer .br Python type: .I int .br Valid values: .RS 11 One of 0 (initial_time), 1 (ineligible_time), 2 (eligible_time), or 3 (run_time). .RE .IP Default: .I 2 (eligible_time) .IP alt_id 8 For a few systems, the session ID is insufficient to track which processes belong to the job. Where a different identifier is required, it is recorded in this attribute. If set, it will also be recorded in the end-of-job accounting record. .br On Windows, holds PBS home directory. .br Readable by all; settable by None. 
.br Format: .I String; may contain white spaces. .br Python type: .I str .br Default: No default .IP "argument_list" 8 Job executable's argument list. Shown if job is submitted with "-- []". .br Can be read and set by user, Operator, Manager. .br Format: .I JSDL=encoded string .RS 11 .I <1st arg> .br .I <2nd arg> .br .I .RE .IP Example: .RS 11 If arguments are "A B": A B .RE .IP Python type: .I str .br Default: No default .IP array 8 Indicates whether this is a job array. Set to .I True if this is an array job. .br Can be read and set by user. Can be read by Manager and Operator. .br Format: .I Boolean .br Python type: .I bool .br Default: .I False .IP array_id 8 Applies only to subjobs. Array identifier of subjob. Readable by all; set by PBS. .br Format: .I String .br Python type: .I str .br Default: No default .IP array_index 8 Applies only to subjobs. Index number of subjob. Readable by all; set by PBS. .br Format: .I String .br Python type: .I int .br Default: No default .IP array_indices_remaining 8 Applies only to job arrays. List of indices of subjobs still queued. Readable by all; set by PBS. .br Format: .I String .br Syntax: Range or list of ranges, e.g. 500, 552, 596-1000 .br Python type: .I str .br Default: No default .IP array_indices_submitted 8 Applies only to job arrays. Complete list of indices of subjobs given at submission time. .br Can be read and set by user. Can be read by Manager and Operator. .br Format: .I String .br Syntax: Given as range, e.g. 1-100 .br Python type: .I pbs.range .br Default: No default .IP array_state_count 8 Applies only to job arrays. Lists number of subjobs in each state. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I pbs.state_count .br Default: No default .IP "block" 8 Specifies whether qsub will wait for the job to complete and return the exit value of the job. 
.br For X11 forwarding jobs, and jobs with .I interactive and .I block attributes set to .I True, the job's exit status is not returned. .br When .I block is .I True, qsub waits for the job to finish. .br Can be read and set by user. Can be read by Manager and Operator. .br Format: .I Boolean .br Python type: .I int .br Default: .I False .IP "Checkpoint" 8 Determines when the job will be checkpointed. An .I $action script is required to checkpoint the job. See the .I pbs_mom(8B) man page. .br Can be read and set by user, Operator, Manager. .br Format: .I String, containing description of interval at which to checkpoint. .br Python type: .I pbs.checkpoint .br Valid values: .RS .IP c 3 Checkpoint at intervals, measured in CPU time, set on the job's execution queue. If no interval set at queue, job is not checkpointed. .IP "c=" 3 Checkpoint at intervals of the specified number of minutes of job CPU time. This value must be greater than zero. If the interval specified is less than that set on the job's execution queue, the queue's interval is used. .br Format: .I Integer .IP w 3 Checkpoint at intervals, measured in walltime, set on job's execution queue. If no interval set at queue, job is not checkpointed. .IP "w=" 3 Checkpoint at intervals of the specified number of minutes of job walltime. This value must be greater than zero. If the interval specified is less that that set on job's execution queue, the queue's interval is used. .br Format: .I Integer .IP n 3 No checkpointing. .IP s 3 Checkpoint only when the server is shut down. .IP u 3 Unset. Defaults to behavior when .I interval argument is set to .I s. .LP Default: .I u .RE .IP comment 8 Comment about job. Informational only. .br Can be read by user. Can be read and set by Operator, Manager. 
.br Format: .I String .br Python type: .I str .br Default: No default .IP create_resv_from_job 8 When this attribute is .I True, when this job is run, immediately creates and confirms a job-specific start reservation on the same resources as the job (including resources inherited by the job), and places the job in the job-specific reservation's queue. Sets the job's .I create_resv_from_job attribute to .I True. Sets the job-specific reservation's .I reserve_job attribute to the ID of the job from which the reservation was created. The new reservation's duration and start time are the same as the job's walltime and start time. If the job is peer scheduled, the job-specific reservation is created in the pulling complex. .br Readable and settable by all. .br Format: .I Boolean .br Python type: .I bool .br Default: .I False .IP ctime 8 Timestamp; time at which the job was created. .br Readable by all; set by PBS. .br Format: .I Integer .br Syntax: Timestamp. .RS 11 Printed by .B qstat in human-readable format. Output by hooks as seconds since epoch. .RE .IP Python type: .I int .br Default: No default .IP depend 8 Specifies inter-job dependencies. .br No limit on number of dependencies. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 ":[, ...][,:[, ...] ...]" .br Must be enclosed in double quotes if it contains commas. .RE .IP Example: "before:123,456" .br Python type: .I pbs.depend .br Valid values: .RS .IP "after:" 3 This job may run at any point after all jobs in .I job ID list have started execution. .IP "afterok:" 3 This job may run only after all jobs in .I job ID list have terminated with no errors. .IP "afternotok:" 3 This job may run only after all jobs in .I job ID list have terminated with errors. .IP "afterany:" This job can run after all jobs in .I job ID list have finished execution, with or without errors. This job will not run if a job in the .I job ID list was deleted without ever having been run. 
.IP "before:" 3 Jobs in .I job ID list may start once this job has started. .IP "beforeok:" 3 Jobs in .I job ID list may start once this job terminates without errors. .IP "beforenotok:" 3 If this job terminates execution with errors, jobs in .I job ID list may begin. .IP "beforeany:" 3 Jobs in .I job ID list may begin execution once this job terminates execution, with or without errors. .IP "on:" 3 This job may run after .I count dependencies on other jobs have been satisfied. This type is used with one of the .I before types listed. .I Count is an integer greater than .I 0. .RE .IP Default: No dependencies .IP egroup 8 If the job is queued, this attribute is set to the group name under which the job is to be run. .br Readable by Manager only. .br Format: .I String .br Python type: .I str .br Default: No default .IP eligible_time 8 The amount of wall clock wait time a job has accrued while the job is blocked waiting for resources. For a job currently accruing .I eligible_time, if we were to add enough of the right type of resources, the job would start immediately. .br Viewable via .B qstat -f. .br Readable by job owner, Manager and Operator. Settable by Operator or Manager. .br Format: .I Duration .br Python type: .I pbs.duration .br Default: .I Zero .IP "Error_Path" 8 The final path name for the file containing the job's standard error stream. See the .B qsub and .B qalter commands. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Python type: .I str .br Syntax: .I [:] .br Valid values: .RS .IP "" 3 Path is relative to the current working directory of command executing on current host. .IP "" 3 Path is absolute path on current host where command is executing. .IP ":" 3 Path is relative to user's home directory on specified host. .IP ":" 3 Path is absolute path on named host. .IP "No path" 3 Path is current working directory where qsub is executed. .RE .IP Default: Default path is current working directory where qsub is run. 
If the output path is specified, but does not include a filename, the default filename is .I .ER. If the path name is not specified, the default filename is .I .e. .IP estimated 8 List of estimated values for job. Used to report job's .I exec_vnode, start_time, and .I soft_walltime. Can be set in a hook or via qalter, but PBS will overwrite the values. .br Format: Format of reported element .br Syntax: .RS 11 .I estimated.=[, estimated.= ...] .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 estimated.= .br where is a resource .RE .IP Reported values: .RS .IP "exec_vnode" 3 The estimated vnodes used by this job. .br Readable by all; settable by Manager and Operator. .br Format: .I String .br Python type: .I pbs.exec_vnode .br Default: Unset .IP "soft_walltime" 3 The estimated soft walltime for this job. Calculated when a job exceeds its soft_walltime resource. .br Readable by all; settable by Manager. .br Format: .I Duration .br Python type: .I pbs.duration .br Default: Unset .IP "start_time" 3 The estimated start time for this job. .br Readable by all; settable by Manager and Operator. .br Format: .I start_time is printed by qstat in human-readable format; .I start_time output in hooks as seconds since epoch. .br Python type: .I int .br Default: Unset .RE .IP .IP etime 8 Timestamp; time when job became eligible to run, i.e. was enqueued in an execution queue and was in the "Q" state. Reset when a job moves queues, or is held then released. Not affected by qaltering. .br Readable by all; set by PBS. .br Format: .I Integer .br Syntax: .RS 11 Printed by qstat in human-readable format. Output in hooks as seconds since epoch. .RE .IP Python type: .I int .br Default: No default .IP euser 8 If the job is queued, this attribute is set to the user name under which the job is to be run. .br Readable by Manager only; set by PBS. .br Format: .I String .br Python type: .I str .br Default: No default .IP "executable" 8 JSDL-encoded listing of job's executable. 
Shown if job is submitted with "-- []". .br Can be read and set by user, Operator, Manager. .br Format: .I JSDL-encoded string .br Syntax: .br Example: .RS 11 If the executable is ping, the string is ping .RE .IP Python type: .I str .br Default: No default .IP "Execution_Time" 8 Timestamp; time after which the job may execute. Before this time, the job remains queued in the (W)ait state. Can be set when stage-in fails and PBS moves job start time out 30 minutes to allow user to fix problem. .br Can be read and set by user, Operator, Manager. .br Format: .I Datetime .br Syntax: .I [[CCwYY]MMDDhhmm[.ss] .br Python type: .I int .br Default: Unset (no delay) .IP exec_host 8 If the job is running, this is set to the name of the host or hosts on which the job is executing. .br Can be read by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 .I /N[*C][+...], .br where .I N is task slot number, starting with 0, on that vnode, and .I C is the number of CPUs allocated to the job. .I *C does not appear if .I C has a value of .I 1. .RE .IP Python type: .I pbs.exec_host .br Default: No default .IP exec_vnode 8 List of chunks for the job. Each chunk shows the name of the vnode(s) from which it is taken, along with the host-level, consumable resources allocated from that vnode, and any AOE provisioned on this vnode for this job. .br If a vnode is allocated to the job but no resources from the vnode are used by the job, the vnode name appears alone. .br If a chunk is split across vnodes, the name of each vnode and its resources appear inside one pair of parentheses, joined with a plus sign ("+"). .br Can be read by user. Can be read and set by Manager, Operator. .br Format: .I String .br Syntax: .RS 11 Each chunk is enclosed in parentheses, and chunks are connected by plus signs. 
.RE .IP Example: .RS 11 For a job which requested two chunks that were satisfied by resources from three vnodes, .I exec_vnode is .br (vnodeA:ncpus=N:mem=X)+(vnodeB:ncpus=P:mem=Y+vnodeC:mem=Z). .br For a job which requested one chunk and exclusive use of a 2-vnode host, where the chunk was satisfied by resources from one vnode, .I exec_vnode is .br (vnodeA:ncpus=N:mem=X)+(vnodeB). .RE .IP Python type: .I pbs.exec_vnode .br Default: No default .IP Exit_status 8 Exit status of job. Set to zero for successful execution. If any subjob of an array job has non-zero exit status, the array job has non-zero exit status. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP "forward_x11_cookie" 8 Contains the X authorization cookie. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I int .br Default: No default .IP "forward_x11_port" 8 Contains the number of the port being listened to by the port forwarder on the submission host. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP "group_list" 8 A list of group names used to determine the group under which the job runs. When a job runs, the server selects a group name from the list according to the following ordered set of rules: .RS .IP "1." 3 Select the group name for which the associated host name matches the name of the server host. .IP "2." 3 Select the group name which has no associated host name. .IP "3." 3 Use the login group for the user name under which the job will be run. .RE .IP .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 .I [@] [,[@] ...] .br Must be enclosed in double quotes if it contains commas. .RE .IP Python type: .I pbs.group_list .br Default: No default .IP hashname 8 No longer used. .IP "Hold_Types" 8 The set of holds currently applied to the job. 
If the set is not null, the job will not be scheduled for execution and is said to be in the .I held state. The .I held state takes precedence over the .I wait state. .br Can be read and set by user, Operator, Manager. .br Format: .I String, made up of the letters .I 'n', 'o', 'p', 's', 'u' .br Hold types: .RS .IP n 3 No hold .IP o 3 Other hold .IP p 3 Bad password .IP s 3 System hold .IP u 3 User hold .RE .IP Python type: .I pbs.hold_types .br Default: .I n (no hold) .RE .IP "interactive" 8 Specifies whether the job is interactive. .br When both this attribute and the .I block attribute are .I True, no exit status is returned. For X11 forwarding jobs, the job's exit status is not returned. .br Cannot be set using a PBS directive. .br Job arrays cannot be interactive. .br Can be set, but not altered, by unprivileged user. Can be read by Operator, Manager. .br Format: .I Boolean .br Python type: .I int .br Default: .I False .IP "jobdir" 8 Path of the job's staging and execution directory on the primary execution host. Either user's home, or private sandbox. Depends on value of .I sandbox attribute. Viewable via .B qstat -f. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I str .br Default: No default .IP "Job_Name" 8 The job name. See the .B qsub and .B qalter commands. .br Can be read and set by user, Operator, Manager. .br Format: .I String up to 236 characters, first character must be alphabetic or numeric .br Python type: .I str .br Default: Base name of job script, or STDIN .IP "Job_Owner" 8 The login name on the submitting host of the user who submitted the batch job. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I str .br Default: No default .IP "job_state" 8 The state of the job. .br Readable by all. Can be set indirectly by all. .br Format: .I Character .br Job states: .RS .IP B 3 .I Begun. Job arrays only. The job array has begun execution. 
.br Python type: PBS job state constant .I pbs.JOB_STATE_BEGUN .IP E 3 .I Exiting. The job has finished, with or without errors, and PBS is cleaning up post-execution. .br Python type: PBS job state constant .I pbs.JOB_STATE_EXITING .IP F 3 .I Finished. Job is finished. Job has completed execution, job failed during execution, or job was deleted. .br Python type: PBS job state constant .I pbs.JOB_STATE_FINISHED .IP H 3 .I Held. The job is held. .br Python type: PBS job state constant .I pbs.JOB_STATE_HELD .IP M 3 .I Moved. Job has been moved to another server. .br Python type: PBS job state constant .I pbs.JOB_STATE_MOVED .IP Q 3 .I Queued. The job resides in an execution or routing queue pending execution or routing. It is not in .B held or .B waiting state. .br Python type: PBS job state constant .I pbs.JOB_STATE_QUEUED .IP R 3 .I Running. The job is in a execution queue and is running. .br Python type: PBS job state constant .I pbs.JOB_STATE_RUNNING .IP S 3 .I Suspended. The job was executing and has been suspended. The job does not use CPU cycles or walltime. .br Python type: PBS job state constant .I pbs.JOB_STATE_SUSPEND .IP T 3 .I Transiting. The job is being routed or moved to a new destination. .br Python type: PBS job state constant .I pbs.JOB_STATE_TRANSIT .IP U 3 .I User suspended. The job was running on a workstation configured for cycle harvesting and the keyboard/mouse is currently busy. The job is suspended until the workstation has been idle for a configured amount of time. .br Python type: PBS job state constant .I pbs.JOB_STATE_SUSPEND_USERACTIVE .IP W 3 .I Waiting. The .I Execution_Time attribute contains a time in the future. Can be set when stage-in fails and PBS moves job start time out 30 minutes to allow user to fix problem. .br Python type: PBS job state constant .I pbs.JOB_STATE_WAIITING .IP X 3 .I Expired. Subjobs only. Subjob is finished (expired.) 
.br Python type: PBS job state constant .I pbs.JOB_STATE_EXPIRED .LP .RE .IP "Join_Path" 8 Specifies whether the job's standard error and standard output streams are to be merged and placed in the file specified in the .I Output_Path job attribute. .br When set to .I True, the job's standard error and standard output streams are merged. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Behavior: .RS .IP eo 3 Standard output and standard error are merged, intermixed, into a single stream, which becomes standard error. .IP oe 3 Standard output and standard error are merged, intermixed, into a single stream, which becomes standard output. .IP n 3 Standard output and standard error are not merged. .RE .IP Python type: .I pbs.join_path .br Default: .I False .IP "Keep_Files" 8 Specifies whether the standard output and/or standard error streams are retained on the execution host in the job's staging and execution directory after the job has executed. Otherwise these files are returned to the submission host. .I Keep_Files overrides the .I Output_Path and .I Error_Path attributes. .br Readable and settable by all. .br Format: .I String .br Python type: .I pbs.keep_files .br Valid values: Can be one of the following: .RS .IP o 3 The standard output stream is retained. The filename is: .I .o .IP e 3 The standard error stream is retained. The filename is: .I .e .IP "eo, oe" 3 Both standard output and standard error streams are retained. .IP d 3 Output and error are written directly to their final destination .IP n 3 Neither stream is retained. Files are returned to submission host. .RE .IP Default: .I n .RS 11 (neither stream is retained, and files are returned to submission host.) .RE .IP "Mail_Points" 8 Specifies state changes for which the server sends mail about the job. .br Can be read and set by user, Operator, Manager. 
.br Format: .I String .br Python type: .I pbs.mail_points .br Valid values: Combination of .I a, b, and .I e, with optional .I j, or .I n by itself. .RS .IP a 3 Mail is sent when job is aborted .IP b 3 Mail is sent at beginning of job .IP e 3 Mail is sent when job ends .IP j 3 Mail is sent for subjobs. Must be combined with one or more of .I a, b, and .I e options. .IP n 3 No mail is sent. Cannot be combined with other options. .RE .IP Default: .I a .IP "Mail_Users" 8 The set of users to whom mail is sent when the job makes state changes specified in the .I Mail_Points job attribute. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: "@[,@]" .br Python type: .I pbs.email_list .br Default: Job owner only .IP "max_run_subjobs" 8 Sets a limit on the number of subjobs that can be running at one time. Can be set using .B qsub -J [%] or .B qalter -Wmax_run_subjobs= . .IP mtime 8 Timestamp; the time that the job was last modified, changed state, or changed locations. .br Format: .I Integer. .br Syntax: Timestamp. .RS 11 Printed by qstat in human-readable format; output in hooks as seconds since epoch. .RE .IP Python type: .I int .br Default: No default .IP "no_stdio_sockets" 8 .B Not used. .IP "Output_Path" 8 The final path name for the file containing the job's standard output stream. See the .B qsub and .B qalter commands. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Python type: .I str .br Syntax: .I [:] .br Valid values: .RS .IP "" 3 Path is relative to the current working directory of command executing on current host. .IP "" 3 Path is absolute path on current host where command is executing. .IP ":" 3 Path is relative to user's home directory on specified host. .IP ":" 3 Path is absolute path on named host. .IP "No path" 3 Path is current working directory where qsub is executed. .RE .IP Default: .RS 11 Default path is current working directory where qsub is run. 
.br If the output path is specified, but does not include a filename, the default filename is .I .OU. .br If the path name is not specified, the default filename is .I .o. .RE .IP "pcap_accelerator" 8 Power attribute. Power cap for an accleerator. Corresponds to Cray .I capmc set_power_cap --accel setting. See .I capmc documentation. .br Readable and settable by all. .br Format: .I Integer .br Units: .I Watts .br Python type: .I int .br Default: Unset .IP "pcap_node" 8 Power attribute. Power cap for a node. Corresponds to Cray .I capmc set_power_cap --node setting. See .I capmc documentation. .br Readable and settable by all. .br Format: .I Integer .br Units: .I Watts .br Python type: .I int .br Default: Unset .IP "pgov" 8 Power attribute. Cray ALPS reservation setting for CPU throttling corresponding to .I p-governor. See BASIL 1.4 documentation. We do not recommend using this attribute. .br Readable and settable by all. .br Format: .I String .br Python type: .I str .br Default: Unset .IP "Priority" 8 The scheduling priority for the job. Higher value indicates higher priority. .br Can be read and set by user, Operator, Manager. .br Format: .I Integer .br Syntax: .I [+|-]nnnnn .br Valid values: [-1024, +1023] inclusive .br Python type: .I int .br Default: Unset .IP "project" 8 The job's project. A project is a way to tag jobs. Each job can belong to at most one project. .br Readable and settable by user, Operator, Manager. .br Format: .I String .RS 11 Can contain any characters except for the following: Slash ("/"), left bracket ("["), right bracket ("]"), double quote ("""), semicolon (";"), colon (":"), vertical bar ("|"), left angle bracket ("<"), right angle bracket (">"), plus ("+"), comma (","), question mark ("?"), and asterisk ("*"). .RE .IP Python type: .I str .br Default: "_pbs_project_default" .IP "pset" 8 .B Deprecated. Name of the placement set used by the job. .br Can be read by user, Operator. Can be read and set by Manager. 
.br Format: .I String .br Python type: .I str .br Default: No default .IP "pstate" 8 Power attribute. Cray ALPS reservation setting for CPU frequency corresponding to .I p-state. See BASIL 1.4 documentation. .br Readable and settable by all. .br Format: .I String .br Units: .I Hertz .br Python type: .I str .br Default: Unset .IP qtime 8 Timestamp; the time that the job entered the current queue. .br Readable by all; settable only by PBS. .br Format: .I Integer .br Syntax: Timestamp. .RS 11 Printed by qstat in human-readable format; output in hooks as seconds since epoch. .RE .IP Python type: .I int .br Default: No default .IP queue 8 The name of the queue in which the job currently resides. .br Readable by all; settable only by PBS. .br Format: .I String .br Python type: .I pbs.queue .br Default: No default .IP queue_rank 8 A number indicating the job's position within the queue. Only used internally by PBS. .br Readable by Manager only. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP queue_type 8 The type of queue in which the job is currently residing. .br Readable by Manager only. .br Format: .I Character .br Valid values: One of .I E or .I R .RS .IP E 3 Execution queue .br Python type: .RS 3 PBS job state constant .I pbs.QUEUE_TYPE_EXECUTION .RE .IP R 3 Routing queue .br Python type: .RS 3 PBS job state constant .I pbs.QUEUE_TYPE_EXECUTION .RE .RE .IP Default: No default .IP "release_nodes_on_stageout" 8 Controls whether job vnodes are released when stageout begins. .br Cannot be used with vnodes tied to Cray X* series systems. .br When cgroups is enabled and this is used with some but not all vnodes from one MoM, resources on those vnodes that are part of a cgroup are not released until the entire cgroup is released. .br The job's .I stageout attribute must be set for the .I release_nodes_on_stageout attribute to take effect. 
.br When set to .I True, all of the job's vnodes not on the primary execution host are released when stageout begins. .br When set to .I False, job's vnodes are released when the job finishes and MoM cleans up the job. .br Readable and settable by all. .br Format: .I Boolean .br Python type: .I bool .br Default: .I False .IP "Remove_Files" 8 Specifies whether standard output and/or standard error files are automatically removed upon job completion. .br Readable and settable by all. .br Format: .I String .br Python type: .I str .br Valid values: "e", "o", "eo", "oe", or unset .RS .IP e 3 Standard error is removed upon job completion. .IP o 3 Standard output is removed upon job completion. .IP "eo, oe" 3 Standard output and standard error are removed upon job completion. .IP unset 3 Neither is removed. .RE .IP Default: Unset .IP "Rerunable" 8 Specifies whether the job can be rerun. Does not affect how a job is treated if the job could not begin execution. .br Job arrays are required to be rerunnable and are rerunnable by default. .br Readable and settable by all. .br Format: .I Character .br Syntax: One of .I y or .I n .br Python type: .I bool .br Default: y (job is rerunnable) .IP "Resource_List" 8 The list of resources required by the job. List is a set of .I = strings. The meaning of name and value is dependent upon defined resources. Each value establishes the limit of usage of that resource. If not set, the value for a resource may be determined by a queue or server default established by the administrator. .br Readable and settable by all. .br Format: .I String .br Syntax: .RS 11 .I Resource_List.=[, Resource_List.=, ...] .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 Resource_List[""]= .br where is any built-in or custom resource .RE .IP Default: No default .IP "resources_released" 8 Listed by vnode, consumable resources that were released when the job was suspended. 
Populated only when .I restrict_res_to_release_on_suspend server attribute is set. .br Readable by all. Set by server. .br Format: .I String .br Syntax: .RS 11 .I (:=: .I =:...)+ .I (:=:...) .RE .IP Python type: .I str .br Default: No default .IP "resource_release_list" 8 Sum of each consumable resource requested by the job that was released when the job was suspended. Populated only when .I restrict_res_to_release_on_suspend server attribute is set. .br Readable by Manager and Operator. Set by server. .br Format: .I String .br Syntax: .RS 11 .I resource_released_list.=, .I resource_released_list.=, ... .RE .IP Python type: .I pbs.pbs_resource .br Default: No default .IP "resources_used" 8 The amount of each resource used by the job. .br Readable by all; set by PBS. .br Format: .I String .br Syntax: .RS 11 List of .I resources_used.=,resources_used.= pairs. .RE .IP Example: resources_used.mem=2mb .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_used[""]= .br where is any built-in or custom resource .RE .IP Default: No default .IP run_count 8 The number of times the server thinks the job has been executed. .br The .I run_count attribute starts at zero. Job is held after 21 tries. .br Can be set via qsub, qalter, or a hook. .br Can be read and set by Manager and Operator. .br Format: .I Integer; must be greater than or equal to zero. .br Python type: .I int .br Default: .I Zero .IP "run_version" 8 Used internally by PBS to track the instance of the job. .br Set by PBS. Visible to Manager only. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP "sandbox" 8 Specifies type of location PBS uses for job staging and execution. .br User-settable via .B qsub -Wsandbox= or via a PBS directive. .br See the $jobdir_root MoM configuration option in .B pbs_mom.8B. .br Can be read and set by user, Operator, Manager. 
.br Format: .I String .br Valid values: .I PRIVATE, HOME, unset .br .RS .IP PRIVATE 3 When set to PRIVATE, PBS creates job-specific staging and execution directories under the directory specified in the .I $jobdir_root MoM configuration option. .IP "HOME or unset" 3 PBS uses the job owner's home directory for staging and execution. .RE .IP Python type: .I str .br Default: Unset .IP schedselect 8 The union of the select specification of the job, and the queue and server defaults for resources in a chunk. .br Can be read by PBS Manager only. .br Format: .I String .br Python type: .I pbs.select .br Default: No default .IP sched_hint 8 .B No longer used. .IP security_context 8 Contains security context of job submitter. Set by PBS to the security context of the job submitter at the time of job submission. If not present when a request is submitted, an error occurs, a server message is logged, and the request is rejected. .br Readable by all; set by PBS. .br Format: .I String in SELinux format .br Default: Unset .IP server 8 The name of the server which is currently managing the job. When the secondary server is running during failover, shows the name of the primary server. After a job is moved to another server, either via qmove or peer scheduling, shows the name of the new server. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I pbs.server .br Default: No default .IP session_id 8 If the job is running, this is set to the session ID of the first executing task. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP "Shell_Path_List" 8 One or more absolute paths to the program(s) to process the job's script file. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 "[@][,[@]...]" .br Must be enclosed in double quotes if it contains commas. 
.RE .IP Python type: .I pbs.path_list .br Default: User's login shell on execution host .IP stagein 8 The list of files to be staged in prior to job execution. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 "@: [, @:, ...]" .RE .IP Python type: .I pbs.staging_list .br Default: No default .IP stageout 8 The list of files to be staged out after job execution. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Syntax: .RS 11 "@: [, @:, ...]" .RE .IP Python type: .I pbs.staging_list .br Default: No default .IP Stageout_status 8 Status of stageout. If stageout succeeded, this is set to 1. If stageout failed, this is set to 0. Displayed only if set. If stageout fails for any subjob of an array job, the value of .I Stageout_status is zero for the array job. Available only for finished jobs. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP stime 8 Timestamp; time when the job started execution. Changes when job is restarted. .br Readable by all; set by PBS. .br Format: .I Integer .br Syntax: Timestamp. .RS 11 Printed by qstat in human-readable format; output in hooks as seconds since epoch. .RE .IP Python type: .I int .br Default: No default .IP "Submit_arguments" 8 Job submission arguments given on the .B qsub command line. Available for all jobs. .br Can be read and set by user, Operator, Manager. .br Format: .I String .br Python type: .I str .br Default: No default .IP "substate" 8 The substate of the job. The substate is used internally by PBS. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP sw_index 8 .B No longer used. .IP "tobjob_ineligible" 8 Allows administrators to mark this job as ineligible to be a top job. .br When .I True , this job is not eligible to be the top job. .br Can be read and set by Manager. 
.br Format: .I Boolean .br Python type: .I bool .br Default: .I False .IP umask 8 The initial umask of the job is set to the value of this attribute when the job is created. This may be changed by umask commands in the shell initialization files such as .profile or .cshrc. .br Can be read and set by user, Operator, Manager. .br Format: .I Decimal integer .br Python type: .I int .br Default: .I 077 .IP "User_List" 8 The list of users which determines the user name under which the job is run on a given host. No length limit. .br When a job is to be executed, the server selects a user name from the list according to the following ordered set of rules: .RS .IP 1. 3 Select the user name from the list for which the associated host name matches the name of the server. .IP 2. 3 Select the user name which has no associated host name; the wild card name. .IP 3. 3 Use the value of .I Job_Owner as the user name. .RE .IP Readable and settable by all. .br Format: .I String .br Syntax: .RS 11 "@ [,@...]" .br Must be enclosed in double quotes if it contains commas. May be up to 256 characters in length. .RE .IP Python type: .I pbs.user_list .br Default: Value of .I Job_Owner job attribute .IP "Variable_List" 8 List of environment variables set in the job's execution environment. See the qsub(1B) command. .br Readable and settable by all. .br Format: .I String .br Syntax: .RS 11 "= [,=...]" .br Must be enclosed in double quotes if it contains commas. .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 Variable_List[""]= .RE .IP Default: No default .SH SEE ALSO qsub(1B), qalter(1B), qhold(1B), qrls(1B), pbs_resources(7B) ================================================ FILE: doc/man1/pbs_login.1B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. 
.\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_login 1B "15 July 2020" Local "PBS Professional" .SH NAME .B pbs_login - cache encrypted user password for authentication .SH Synopsis .B pbs_login .br .B pbs_login -m .br echo | .B pbs_login -p .SH Description The .B pbs_login command encrypts the password and caches it locally where it can be used by daemons for authorization. Job submitters must run this command at each submission host each time their password changes. 
On Windows, the .B win_postinstall script calls .B pbs_login to store the PBS service account password so that the account user can be authenticated by daemons. .SH Required Privilege Can be run by any user. .SH Options to pbs_login .IP "(no options)" 8 Queries user for password. .IP "-m " 8 This option is intended to be used only by the PBS service account, which is the account that is used to execute .B pbs_mom via the Service Control Manager on Windows. This option is used during installation when invoked by the .B win_postinstall script, or by the administrator when the PBS service account password has changed. Stores PBS service account password in the mom_priv directory. .IP "-p" 8 Caches user password on client host. Intended to be run by job submitter at client host. Allows job submitter to be authenticated by daemons. ================================================ FILE: doc/man1/pbs_module.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . 
.\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_module 7B "6 April 2020" Local "PBS Professional" .SH NAME .B pbs_module \- Python interface to PBS and PBS hook environment .SH DESCRIPTION The .I pbs module provides an interface to PBS and the hook environment. The interface is made up of Python objects, which have attributes and methods. You can operate on these objects using Python code. .SH PBS MODULE OBJECTS .IP pbs.acl Represents a PBS ACL type. .IP pbs.args Represents a space-separated list of PBS arguments to commands like qsub, qdel. .IP pbs.argv[] Represents a list of argument strings to be passed to the program .IP pbs.BadAttributeValueError Raised when setting the attribute value of a pbs.* object to an invalid value. .IP pbs.BadAttributeValueTypeError Raised when setting the attribute value of a pbs.* object to an invalid value type. .IP pbs.BadResourceValueError Raised when setting the resource value of a pbs.* object to an invalid value. .IP pbs.BadResourceValueTypeError Raised when setting the resource value of a pbs.* object to an invalid value type. .IP pbs.checkpoint Represents a job's .I Checkpoint attribute. .IP pbs.depend Represents a job's .I depend attribute. .IP pbs.duration Represents a time interval. 
.IP pbs.email_list Represents the set of users to whom mail may be sent. .IP pbs.env[] Dictionary of environment variables. .IP pbs.event Represents a PBS event. .IP pbs.EventIncompatibleError Raised when referencing a non-existent attribute in pbs.event(). .IP pbs.EXECHOST_PERIODIC The .I exechost_periodic event type. .IP pbs.EXECHOST_STARTUP The .I exechost_startup event type. .IP pbs.EXECJOB_ATTACH The .I execjob_attach event type. .IP pbs.EXECJOB_BEGIN The .I execjob_begin event type. .IP pbs.EXECJOB_END The .I execjob_end event type. .IP pbs.EXECJOB_EPILOGUE The .I execjob_epilogue event type. .IP pbs.EXECJOB_LAUNCH The .I execjob_launch event type. .IP pbs.EXECJOB_PRETERM The .I execjob_preterm event type. .IP pbs.EXECJOB_PROLOGUE The .I execjob_prologue event type. .IP pbs.exec_host Represents a job's .I exec_host attribute. .IP pbs.exec_vnode Represents a job's .I exec_vnode attribute. .IP pbs.group_list Represents a list of group names. .IP pbs.hold_types Represents a job's .I Hold_Types attribute. .IP pbs.hook_config_filename Contains path to hook's configuration file. .IP pbs.job Represents a PBS job. .IP pbs.job_list[] Represents a list of pbs.job objects. .IP pbs.job_sort_formula Represents the server's .I job_sort_formula attribute. .IP pbs.JOB_STATE_BEGUN Represents the job array state of having started. .IP pbs.JOB_STATE_EXITING Represents the job state of exiting. .IP pbs.JOB_STATE_EXPIRED Represents the subjob state of expiring. .IP pbs.JOB_STATE_FINISHED Represents the job state of finished. .IP pbs.JOB_STATE_HELD Represents the job state of held. .IP pbs.JOB_STATE_MOVED Represents the job state of moved. .IP pbs.JOB_STATE_QUEUED Represents the job state of queued. .IP pbs.JOB_STATE_RUNNING Represents the job state of running. .IP pbs.JOB_STATE_SUSPEND Represents the job state of suspended. .IP pbs.JOB_STATE_SUSPEND_USERACTIVE Represents the job state of suspended due to user activity. 
.IP pbs.JOB_STATE_TRANSIT Represents the job state of transiting. .IP pbs.JOB_STATE_WAITING Represents the job state of waiting. .IP pbs.join_path Represents a job's .I Join_Path attribute. .IP pbs.keep_files Represents a job's .I Keep_Files attribute. .IP pbs.license_count Represents a set of licensing-related counters. .IP pbs.LOG_DEBUG Log level 004. .IP pbs.LOG_ERROR Log level 004. .IP pbs.LOG_WARNING Log level 004. .IP pbs.mail_points Represents a job's .I Mail_Points attribute. .IP pbs.MODIFYJOB The .I modifyjob event type. .IP pbs.MOVEJOB The .I movejob event type. .IP pbs.ND_BUSY Represents .I busy vnode state. .IP pbs.ND_DEFAULT_EXCL Represents .I default_excl sharing vnode attribute value .IP pbs.ND_DEFAULT_SHARED Represents .I default_shared sharing vnode attribute value. .IP pbs.ND_DOWN Represents .I down vnode state .IP pbs.ND_FORCE_EXCL Represents .I force_excl sharing vnode attribute value. .IP pbs.ND_FREE Represents .I free vnode state. .IP pbs.ND_GLOBUS PBS no longer supports Globus. The Globus functionality has been .B removed from PBS. Represents .I globus vnode .I ntype. .IP pbs.ND_IGNORE_EXCL Represents .I ignore_excl sharing vnode attribute value. .IP pbs.ND_JOBBUSY Represents .I job-busy vnode state. .IP pbs.ND_JOB_EXCLUSIVE Represents .I job-exclusive vnode state. .IP pbs.ND_OFFLINE Represents .I offline vnode state. .IP pbs.ND_PBS Represents .I pbs vnode .I ntype. .IP pbs.ND_PROV Represents .I provisioning vnode state. .IP pbs.ND_RESV_EXCLUSIVE Represents .I resv-exclusive vnode state. .IP pbs.ND_STALE Represents .I stale vnode state. .IP pbs.ND_STATE_UNKNOWN Represents .I state-unknown, down vnode state. .IP pbs.ND_UNRESOLVABLE Represents the .I unresolvable vnode state. .IP pbs.ND_WAIT_PROV Represents .I wait-provisioning vnode state. .IP pbs.node_group_key Represents the server or queue .I node_group_key attribute. .IP pbs.path_list Represents a list of pathnames. .IP pbs.pbs_conf[] Dictionary of entries in pbs.conf. 
.IP pbs.pid Represents the process ID of a process belonging to a job. .IP pbs.place Represents the .I place job submission specification. .IP pbs.progname Path of job shell or executable. .IP pbs.QTYPE_EXECUTION The .I execution queue type. .IP pbs.QTYPE_ROUTE The .I route queue type. .IP pbs.queue Represents a PBS queue. .IP pbs.QUEUEJOB The .I queuejob event type. .IP pbs.range Represents a range of numbers referring to array indices. .IP pbs.resv Represents a PBS reservation. .IP pbs.RESVSUB The .I resvsub event type. .IP pbs.RESV_STATE_BEING_DELETED Represents the reservation state RESV_BEING_DELETED. .IP pbs.RESV_STATE_CONFIRMED Represents the reservation state RESV_CONFIRMED. .IP pbs.RESV_STATE_DEGRADED Represents the reservation state RESV_DEGRADED. .IP pbs.RESV_STATE_DELETED Represents the reservation state RESV_DELETED. .IP pbs.RESV_STATE_DELETING_JOBS Represents the reservation state RESV_DELETING_JOBS. .IP pbs.RESV_STATE_FINISHED Represents the reservation state RESV_FINISHED. .IP pbs.RESV_STATE_NONE Represents the reservation state RESV_NONE. .IP pbs.RESV_STATE_RUNNING Represents the reservation state RESV_RUNNING. .IP pbs.RESV_STATE_TIME_TO_RUN Represents the reservation state RESV_TIME_TO_RUN. .IP pbs.RESV_STATE_UNCONFIRMED Represents the reservation state RESV_UNCONFIRMED. .IP pbs.RESV_STATE_WAIT Represents the reservation state RESV_WAIT. .IP pbs.route_destinations Represents a queue's .I route_destinations attribute. .IP pbs.RUNJOB The .I runjob event type. .IP pbs.select Represents the .I select job submission specification. .IP pbs.server Represents the local PBS server. .IP pbs.size Represents a PBS .I size type. .IP pbs.software Represents a site-dependent software specification resource. .IP pbs.staging_list Represents a list of file stagein or stageout parameters. .IP pbs.state_count Represents a set of job-related state counters. .IP pbs.SV_STATE_ACTIVE Represents the server state "Scheduling". 
.IP pbs.SV_STATE_HOT Represents the server state "Hot_Start". .IP pbs.SV_STATE_IDLE Represents the server state "Idle". .IP pbs.SV_STATE_SHUTDEL Represents the server state "Terminating, Delayed". .IP pbs.SV_STATE_SHUTIMM Represents the server state "Terminating". .IP pbs.SV_STATE_SHUTSIG Represents the server state "Terminating", when a signal has been caught. .IP pbs.UnsetAttributeNameError Raised when referencing a non-existent name of a pbs.* object. .IP pbs.UnsetResourceNameError Raised when referencing a non-existent name of a pbs.* object. .IP pbs.user_list Represents a list of user names. .IP pbs.vchunk Represents a resource chunk assigned to a job. .IP pbs.version Represents PBS version information. .IP pbs.vnode Represents a PBS vnode. .IP pbs.vnode_list[] Represents a list of PBS vnodes. .IP SystemExit Raised when accepting or rejecting an action. .LP .SH PBS MODULE GLOBAL METHODS .IP pbs.acl("[+|-]][,...]") Creates an object representing a PBS ACL, using the given string parameter. Instantiation of these objects requires a formatted input string. .IP pbs.args("") where .I are space-separated arguments to a command such as .B qsub or .B qdel. Creates an object representing the arguments to the command. Example: .RS 10 pbs.args("-Wsuppress_email=N -r y") .RE .IP Instantiation of these objects requires a formatted input string. .IP pbs.checkpoint("") where .I must be one of "n", "s", "c", "c=mmm", "w", or "w=mmm" Creates an object representing the job's .I Checkpoint attribute, using the given string. Instantiation of these objects requires a formatted input string. .IP pbs.depend("") .I must be of format ":[,...]", or "on:", and where .I is one of "after", "afterok", "afterany", "before", "beforeok", and "beforenotok". Creates a PBS dependency specification object representing the job's .I depend attribute, using the given .I . Instantiation of these objects requires a formatted input string. 
.IP pbs.duration("[[hours:]minutes:]seconds[.milliseconds]") Creates a time specification duration instance, returning the equivalent number of seconds from the given time string. Represents an interval or elapsed time in number of seconds. Duration objects can be specified using either a time or an integer. See the "pbs.duration()" creation method. .IP pbs.duration() Creates an integer duration instance using the specified number of seconds. A .I pbs.duration instance can be operated on by any of the Python .I int functions. When performing arithmetic operations on a .I pbs.duration type, ensure the resulting value is a .I pbs.duration() type, before assigning to a job member that expects such a type. .IP pbs.email_list("[,...]") Creates an object representing a mail list. Instantiation of these objects requires a formatted input string. .IP pbs.exec_host("host/N[*C][+...]") Create an object representing the .I exec_host job attribute, using the given host and resource specification. Instantiation of these objects requires a formatted input string. .IP pbs.exec_vnode("[+...]") .I is () Creates an object representing the .I exec_vnode job attribute, using the given vnode and resource specification. When the .B qrun -H command is used, or when the scheduler runs a job, the .I pbs.job.exec_vnode object contains the vnode specification for the job. Instantiation of these objects requires a formatted input string. .br Example: .br pbs.exec_vnode("(vnodeA:ncpus=N:mem=X)+(nodeB:ncpus=P:mem=Y+nodeC:mem=Z)") .br This object is managed and accessed via the .I str() or .I repr() functions. .br Example: .br Python> ev = pbs.server().job("10").exec_vnode .br Python> str(ev) .br "(vnodeA:ncpus=2:mem=200m)+(vnodeB:ncpus=5:mem=1g)" .IP pbs.get_hook_config_file() Returns the path to the hook's configuration file, or None if there is no configuration file. 
For example: .RS 10 configfilepath = pbs.get_hook_config_file() .RE .IP pbs.get_local_nodename() This returns a Python str whose value is the name of the local natural vnode. If you want to refer to the vnode object representing the current host, you can pass this vnode name as the key to .I pbs.event().vnode_list[]. For example: .RS 10 Vn = pbs.event().vnode_list[pbs.get_local_nodename()] .RE .IP pbs.get_pbs_conf() This method returns a dictionary of values which represent entries in the pbs.conf file. The method reads the file on the host where a hook runs, so pre-execution event hooks get the entries on the server host, and execution event hooks get the entries on the execution host where the hook runs. The method reads /etc/pbs.conf on the host where pbs_python runs. Example: .RS 10 pbs_conf = pbs.get_pbs_conf() .br pbs.logmsg(pbs.LOG_DEBUG, "pbs home is %s" % (pbs_conf['PBS_HOME'])) .RE .IP If you HUP pbs_mom (Linux/UNIX), pbs.get_pbs_conf returns the reloaded contents of the pbs.conf file. .IP pbs.group_list("[@][,[@]...]") Creates an object representing a PBS group list. To use a group list object: .br pbs.job.group_list = pbs.group_list(....) .br Instantiation of these objects requires a formatted input string. .IP pbs.hold_types("") where .I is one of "u", "o", "s", or "n". Creates an object representing the .I Hold_Types job attribute. Instantiation of these objects requires a formatted input string. .IP pbs.job_sort_formula("") where .I is a string containing a math formula. Creates an object representing the .I job_sort_formula server attribute. Instantiation of these objects requires a formatted input string. .IP pbs.join_path({"oe"|"eo"|"n"}) Creates an object representing the .I Join_Path job attribute. Instantiation of these objects requires a formatted input string. .IP pbs.keep_files("") where .I is one of "o", "e", "oe", "eo". Creates an object representing the .I Keep_Files job attribute. 
Instantiation of these objects requires a formatted input string. .IP pbs.license_count("Avail_Global:Avail_Local:Used:High_Use:") Instantiates an object representing a .I license_count attribute. Instantiation of these objects requires a formatted input string. .IP pbs.logjobmsg(job_ID,message) where .I job_ID must be an existing or previously existing job ID and where .I message is an arbitrary string. This puts a custom string in the PBS Server log. The .B tracejob command can be used to print out the job-related messages logged by a hook script. Messages are logged at log event class .I pbs.LOG_DEBUG. .IP pbs.logmsg(log_event_class,message) where .I message is an arbitrary string, and where .I log_event_class can be one of the message log event class constants: .br pbs.LOG_WARNING .br pbs.LOG_ERROR .br pbs.LOG_DEBUG .br This puts a custom string in the daemon log. .IP pbs.mail_points("") where .I is "a", "b", and/or "e", or "n". Creates an object representing a .I Mail_Points attribute. Instantiation of these objects requires a formatted input string. .IP pbs.node_group_key("") Creates an object representing the resource to be used for node grouping, using the specified resource. .IP pbs.path_list("[@][,@...]") Creates an object representing a PBS pathname list. To use a path list object: .br pbs.job.Shell_Path_List = pbs.path_list(....) .br Instantiation of these objects requires a formatted input string. .IP pbs.env() Creates an empty environment variable list. For example, to create an empty environment variable list: .RS 10 pbs.event().env = pbs.pbs_env() .RE .IP pbs.place("[arrangement]:[sharing]:[group]") .I arrangement can be "pack", "scatter", "free", "vscatter" .br .I sharing can be "shared", "excl", "exclhost" .br .I group can be of the form "group=" .br .I [arrangement], [sharing], and .I [group] can be given in any order or combination. .br Creates a place object representing the job's place specification. 
Instantiation of these objects requires a formatted input string. .br Example: .br pl = pbs.place("pack:excl") .br s = repr(pl) (or s = `pl`) .br letter = pl[0] (assigns 'p' to letter) .br s = s + ":group=host" (append to string) .br pl = pbs.place(s) (update original pl) .IP pbs.range("-:") Creates a PBS object representing a range of values. .br Example: .br pbs.range("1-30:3") .br Instantiation of these objects requires a formatted input string. .IP pbs.reboot([]) This stops hook execution, so that remaining lines in the hook script are not executed, and starts the tasks that would normally begin after the hook is finished, such as flagging the current host to be rebooted. The MoM logs show the following: .RS 10 requested for host to be rebooted .RE .IP We recommend that before calling pbs.reboot(), you set any vnodes managed by this MoM offline, and requeue the current job, if this hook is not an exechost_periodic hook. For example: .RS 10 for v in pbs.event().vnode_list.keys(): .br \ \ \ pbs.event().vnode_list[v].state = pbs.ND_OFFLINE .br \ \ \ pbs.event().vnode_list[v].comment = "MoM host rebooting" .br pbs.event().job.rerun() .br pbs.reboot() .RE .IP The effect of the call to pbs.reboot() is not instantaneous. The reboot happens after the hook executes, and after any of the other actions such as pbs.event().job.rerun(), pbs.event().delete(), and pbs.event().vnode_list[] take effect. A hook with its user attribute set to pbsuser cannot successfully invoke pbs.reboot(), even if the owner is a PBS Manager or Operator. If this is attempted, the host is not rebooted, and the following message appears at log event class PBSEVENT_DEBUG2 in the MoM logs: .RS 10 ; Not allowed to issue reboot if run as user. .RE .IP The is an optional argument. It is a Python str which is executed instead of the reboot command that is the default for the system. 
For example: .RS 10 pbs.reboot("/usr/local/bin/my_reboot -s 10 -c 'going down in 10'") .RE .IP The specified is executed in a shell on Linux/UNIX or via cmd on Windows. .IP pbs.route_destinations("[,,...]") where .I is queue_name[@server_host[:port]] .br Creates an object that represents a .I route_destinations routing queue attribute. Instantiation of these objects requires a formatted input string. .IP pbs.select("[N:]res=val[:res=val][+[N:]res=val[:res=val]...]") Creates a .I select object representing the job's select specification. Instantiation of these objects requires a formatted input string. Example: .br sel = pbs.select("2:ncpus=1:mem=5gb+3:ncpus=2:mem=5gb") .br s = repr(sel) (or s = `sel`) .br letter = s[3] (assigns 'c' to letter) .br s = s + "+5:scratch=10gb" (append to string) .br sel = pbs.select(s) (reset the value of sel) .br .IP pbs.size() Creates a PBS .I size object using the given integer value, storing the value as the number of bytes. Size objects can be specified using either an integer or a string. See the "pbs.size("")" creation method. .IP pbs.size("") Creates a PBS .I size object out of the given string specification. The size of a word is the word size on the execution host. .I Size objects can be specified using either an integer or a string. To operate on .I pbs.size instances, use the "+" and "-" operators. To compare .I pbs.size instances, use the "==", "!=", ">", "<", ">=", and "<=" operators. Example: the sizes are normalized to the smaller of the 2 suffixes. In this case, "10gb" becomes "10240mb" and is added to "10mb": .br sz = pbs.size("10gb") .br sz = sz + 10mb .br 10250mb .br Example: the following returns .I True because .I sz is greater than 100 bytes: .br if sz > 100: .br \ \ \ \ gt100 = True .br .IP pbs.software("") Creates an object representing a site-dependent software resource. Instantiation of these objects requires a formatted input string. 
.IP pbs.staging_list("[,,...]") where .I is @: Creates an object representing a job file staging parameters list. To use a staging list object: .br pbs.job.stagein = pbs.staging_list(....) .br Instantiation of these objects requires a formatted input string. .IP pbs.state_count("Transit:Queued:Held:Running:Exiting:Begun:) Instantiates an object representing a .I state_count attribute. Instantiation of these objects requires a formatted input string. .IP pbs.user_list("[@][,@...]") Creates an object representing a PBS user list. To use a user list object: .br pbs.job.User_List = pbs.user_list(....) .br Instantiation of these objects requires a formatted input string. .IP pbs.version("") Creates an object representing the PBS version string. Instantiation of these objects requires a formatted input string. .SH ATTRIBUTES AND RESOURCES .br Hooks can read Server, Queue, or reservation resources. Hooks can read vnode or job attributes and resources. Hooks can modify .IP The resources requested by a job .br The resources used by a job .br The attributes of a job .br The resource arguments to pbs_rsub .br Vnode attributes and resources .br The shell or program to be executed in a job .br The arguments to the shell or program to be executed in a job .br The environment of the job .LP Custom and built-in PBS resources are represented in Python dictionaries, where the resource names are the dictionary keys. Built-in resources are listed in pbs_resources(7B). You reference a resource through a vnode, the Server, the event that triggered the hook, or the current job, for example: .IP pbs.server().resources_available["< resource name>"] .br pbs.event().job.Resource_List["< resource name>"] .br pbs.event().vnode_list[].resources_available["< resource name >"] .LP The resource name must be in quotes. 
Example: Get the number of CPUs: .IP ncpus = Resource_List["ncpus"] .LP An instance R of a job resource can be set as follows: .IP R[""] = .LP For example: .IP pbs.event().job().Resource_List["mem"] = 8gb .LP .SH EXCEPTIONS .IP pbs.BadAttributeValueError Raised when setting the attribute value of a pbs.* object to an invalid value. .IP pbs.BadAttributeValueTypeError Raised when setting the attribute value of a pbs.* object to an invalid value type. .IP pbs.BadResourceValueError Raised when setting the resource value of a pbs.* object to an invalid value. .IP pbs.BadResourceValueTypeError Raised when setting the resource value of a pbs.* object to an invalid value type. .IP pbs.EventIncompatibleError Raised when referencing a non-existent attribute in pbs.event(). .IP pbs.UnsetAttributeNameError Raised when referencing a non-existent name of an attribute. .IP pbs.UnsetResourceNameError Raised when referencing a non-existent name of a resource. .IP SystemExit Raised when accepting or rejecting an action. .LP If a hook encounters an unhandled exception: .IP PBS rejects the corresponding action, and an error message is printed to stderr. .br A message is printed to the daemon log. .LP .SH SEE ALSO pbs_hook_attributes(7B), pbs_resources(7B), qmgr(1B) ================================================ FILE: doc/man1/pbs_node_attributes.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. 
.\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_node_attributes 7B "17 July 2020" Local "PBS Professional" .SH NAME .B pbs_node_attributes \- attributes of PBS vnodes .SH DESCRIPTION Vnodes have the following attributes: .IP comment 8 Information about this vnode. This attribute may be set by the manager to any string to inform users of any information relating to the node. If this attribute is not explicitly set, the PBS server will use the attribute to pass information about the node status, specifically why the node is down. If the attribute is explicitly set by the manager, it will not be modified by the server. .br Readable by all; settable by Manager. .br Format: .I String .br Python type: .I str .br Default: No default .IP current_aoe 8 The AOE currently instantiated on this vnode. Cannot be set on server's host. .br Readable by all; settable by Manager. 
.br Format: .I String .br Python type: .I str .br Default: .I Unset .IP current_eoe 8 Current value of eoe on this vnode. We do not recommend setting this attribute manually. .br Readable by all; settable by Manager (not recommended). .br Format: .I String .br Python type: .I str .br Default: .I Unset .IP in_multivnode_host 8 Specifies whether a vnode is part of a multi-vnoded host. Used internally. Do not set. .br Readable and settable by Manager (not recommended). .br Format: .I Integer .br Python type: .I int .br Behavior: .RS .IP 1 3 Part of a multi-vnode host .IP Unset 3 Not part of a multi-vnode host .RE .IP Default: .I Unset .IP jobs 8 List of jobs running on this vnode. .br Readable by all; set by PBS. .br Format: .I String .br Syntax: .I /, ... .br Python type: .I int .br .IP last_state_change_time 8 Records the most recent time that this node changed state. .br Format: .RS 11 Timestamp .br Printed by qstat in human-readable Date format. .br Output in hooks as seconds since epoch. .RE .IP .IP last_used_time 8 Records the most recent time that this node finished being used for a job or reservation. Set at creation or reboot time. Updated when node is released early from a running job. Reset when node is ramped up. .br Format: .RS 11 Timestamp .br Printed by qstat in human-readable Date format. .br Output in hooks as seconds since epoch. .RE .IP license 8 .br Indicates whether this vnode is licensed. .br Readable by all; set by PBS. .br Format: .I Character .br Python type: .I str .br Valid values: .RS .IP l 3 This vnode is licensed. .RE .IP Default: .I Unset .IP license_info 8 Number of licenses assigned to this vnode. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: .I Unset .IP lictype 8 No longer used. .IP maintenance_jobs 8 List of jobs that were running on this vnode, but have been suspended via the .I admin-suspend signal to qsig. .br Readable by Manager; set by PBS. 
.br Format: .I string_array .br Python type: .I str .br Default: No default .IP Mom Hostname of host on which MoM daemon runs. .br Readable by all. Can be explicitly set by Manager only via .B qmgr, and only at vnode creation. The server can set this to the FQDN of the host on which MoM runs, if the vnode name is the same as the hostname. .br Format: .I String .br Python type: .I str .br Default: Value of .I vnode resource (vnode name) .IP name 8 The name of this vnode. .br Readable by all; settable by Manager. .br Format: .I String .br Python type: .I str .br Default: No default .IP no_multinode_jobs 8 Controls whether jobs which request more than one chunk are allowed to execute on this vnode. Used for cycle harvesting. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 Jobs requesting more than one chunk are not allowed to execute on this vnode. .RE .IP Default: .I False .IP ntype 8 The type of this vnode. .br Readable by all; settable by Manager. .br Format: .I String .br Valid values: .RS .IP PBS 3 Normal vnode .br Python type: .I pbs.ND_PBS .br Default: .I PBS .RE .IP partition 8 Name of partition to which this vnode is assigned. A vnode can be assigned to at most one partition. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Python type: .I str .br Default: No default .IP pbs_version 8 The version of PBS for this MoM. .br Readable by all; set by PBS. .br Format: .I String .br Python type: .I str .br Default: No default .IP pcpus 8 .B Deprecated. The number of physical CPUs on this vnode. This is set to the number of CPUs available when MoM starts. For a multiple-vnode MoM, only the natural vnode has .I pcpus. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: .I Number of CPUs on startup .IP pnames The list of resources being used for placement sets. Not used for scheduling; advisory only. 
.br Readable by all; settable by Manager. .br Format: .I String .br Syntax: .I Comma-separated list of resource names .br Python type: .I str .br Default: No default .IP Port 8 Port number on which MoM daemon listens. .br Can be explicitly set only via .B qmgr, and only at vnode creation. Readable and settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: .I 15002 .IP poweroff_eligible 8 Enables powering this vnode up and down by PBS. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Values: .RS 11 .IP True PBS can power this vnode on and off. .IP False PBS cannot power this vnode on and off. .RE .IP Default: .I False .IP power_provisioning 8 Enables use of power profiles by this vnode. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 Power provisioning is enabled at this vnode. .IP False 3 Power provisioning is disabled at this vnode. .RE .IP Default: .I False .IP Priority 8 The priority of this vnode compared with other vnodes. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Valid values: .I -1024 to +1023 .br Default: No default .IP provision_enable Controls whether this vnode can be provisioned. Cannot be set on server's host. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 This vnode may be provisioned. .IP False 3 This vnode may not be provisioned. .RE .IP Default: .I False .IP queue 8 .B Deprecated. The queue with which this vnode is associated. Each vnode can be associated with at most 1 queue. Queues can be associated with multiple vnodes. Any jobs in a queue that has associated vnodes can run only on those vnodes. If a vnode has an associated queue, only jobs in that queue can run on that vnode. .br Readable by all; settable by Manager. 
.br Format: .I String .br Python type: .I pbs.queue .br Behavior: .RS .IP "" 3 Only jobs in specified queue may run on this vnode. .IP Unset 3 Any job in any queue that does not have associated vnodes can run on this vnode. .RE .IP Default: No default .IP resources_assigned 8 The total amount of each resource allocated to jobs and started reservations running on this vnode. .br Readable by all; set by PBS. .br Format: String .br Syntax: .RS 11 .I resources_assigned.=[,resources_assigned.= .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_assigned[''] = < val> .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP resources_available 8 The list of resource and amounts available on this vnode. If not explicitly set, the amount shown is that reported by the pbs_mom running on this vnode. If a resource value is explicitly set, that value is retained across restarts. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .I resources_available.=, .I resources_available. = , ... .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_available[''] = < val> .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP resv 8 List of advance and standing reservations pending on this vnode. .br Readable by all; set by PBS. .br Format: .I String .br Syntax: .RS 11 .I [, , ...] .br (Comma-separated list of reservation IDs) .RE .IP Python type: .I str .br Example: resv = R142.examplemachine, R143.examplemachine .br Default: No default .IP resv_enable 8 Controls whether the vnode can be used for advance and standing reservations. Reservations are incompatible with cycle harvesting. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS 11 When set to .I True, this vnode can be used for reservations. 
Existing reservations are honored when this attribute is changed from .I True to .I False. .RE .IP Default: .I True .IP sharing 8 Specifies whether more than one job at a time can use the resources of the vnode or the vnode's host. Either (1) the vnode or host is allocated exclusively to one job, or (2) the vnode's or host's unused resources are available to other jobs. .br Can be set using .I pbs_mom -s insert only. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Python type: .I int .br Valid values: .RS .IP default_shared 3 Defaults to .I shared .br Python type: .I pbs.ND_DEFAULT_SHARED .IP default_excl 3 Defaults to .I exclusive .br Python type: .I pbs.ND_DEFAULT_EXCL .IP default_exclhost 3 Entire host is assigned to the job unless the job's sharing request specifies otherwise .br Python type: .I pbs.ND_DEFAULT_EXCLHOST .IP ignore_excl 3 Overrides any job .I place=excl setting .br Python type: .I pbs.ND_IGNORE_EXCL .IP force_excl 3 Overrides any job .I place=shared setting .br Python type: .I pbs.ND_FORCE_EXCL .IP force_exclhost 3 The entire host is assigned to the job, regardless of the job's sharing request .br Python type: .I pbs.ND_FORCE_EXCLHOST .IP Unset 3 Defaults to .I shared .RE .IP Behavior of a vnode or host is determined by a combination of the .I sharing attribute and a job's placement directive, defined as follows: .nf | Vnode Behavior | Host Behavior | when place= | when place= | | sharing value | unset shared excl |exclhost !=exclhost ---------------------------------------------------------------- not set | shared shared excl | excl depends on place default_shared | shared shared excl | excl depends on place default_excl | excl shared excl | excl depends on place default_exclhost | excl shared excl | excl depends on place ignore_excl | shared shared shared| shared not exclusive force_excl | excl excl excl | excl not exclusive force_exclhost | excl excl excl | excl excl .fi Example: : sharing=force_excl .br 
Default value: .I default_shared .IP state 8 Shows or sets the state of the vnode. .br Readable by all. All states are set by PBS; Operator and Manager can set .I state to .I offline. .br Format: .I String .br Syntax: .I [, , ...] .br (Comma-separated list of one or more states) .br Python type: .I int .br Valid values: .RS .IP busy 3 Vnode is reporting load average greater than allowed max. Can combine with .I offline .IP down 3 Node is not responding to queries from the server. Cannot be combined with .I free, provisioning. .IP free 3 Vnode is up and capable of accepting additional job(s). Cannot be combined with other states. .IP job-busy 3 All CPUs on the vnode are allocated to jobs. Can combine with: .I offline, resv-exclusive .IP job-exclusive 3 Entire vnode is exclusively allocated to one job at the job's request. Can combine: .I offline, resv-exclusive .IP offline 3 Jobs are not to be assigned to this vnode. Can combine: .I busy, job-busy, job-exclusive, resv-exclusive .IP provisioning 3 Vnode is being provisioned. Cannot be combined with other states. .IP resv-exclusive 3 Running reservation has requested exclusive use of vnode. Can combine with: .I job-exclusive, offline .IP stale 3 Vnode was previously reported to server, but is no longer reported to server. Cannot combine with .I free, provisioning. .IP state-unknown 3 The server has never been able to contact the vnode. Either MoM is not running on the vnode, the vnode hardware is down, or there is a network problem. .IP unresolvable 3 The server cannot resolve the name of the vnode. .IP wait-provisioning 3 Vnode needs to be provisioned, but can't: limit reached for concurrently provisioning vnodes. See the .I max_concurrent_provision server attribute. .RE .IP Default: No default .IP topology_info Contains information intended to be used in hooks. .br Visible in and usable by hooks only. Invisible to Manager, Operator, User. 
.br Format: .I XML String .br Python type: .I str .br Default value: .I Unset .IP vnode_pool 8 Cray only. Allows just one MoM, instead of all, to report inventory upon startup, allowing faster startup and less network communication between server and non-reporting MoMs. On each Cray, all MoMs must have same setting for this attribute. Can be set only at vnode creation; valid only on login nodes running a MoM. Not supported on non-Cray machines. .br Readable by all; settable by Manager. .br Format: .I Integer .br Python type: .I int .br Behavior: .RS .IP ">0" 3 Only one MoM per Cray reports inventory. .IP Unset 3 Each MoM reports inventory separately. .RE .IP Default: .I 0 (Unset) .SH SEE ALSO qmgr(1B) ================================================ FILE: doc/man1/pbs_professional.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. 
For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_professional 7B "6 May 2020" Local "PBS Professional" .SH NAME .B PBS Professional \- The PBS Professional workload management system .SH DESCRIPTION PBS Professional is an HPC workload manager and job scheduler. PBS schedules jobs onto systems with the required resources, according to specified policy. PBS runs on most major platforms. See .B www.pbsworks.com and .B https://pbspro.atlassian.net/wiki/spaces/PBSPro/overview. .B Primary Commands .br .IP "init.d/pbs" 8 Starts, stops or restarts PBS daemons on the local machine. This command is typically placed in /etc/init.d so that PBS starts up automatically. See the .B pbs.8B man page. .br .IP "qmgr" 8 Administrator's interface for configuring and managing PBS. See the .B qmgr.8B man page. .IP "qstat" 8 Administrator's and job submitter's tool for checking server, queue, and job status. See the .B qstat.1B man page. .IP "qsub" 8 Job submitter's tool for submitting jobs to PBS. See the .B qsub.1B man page. .LP .SH SEE ALSO .br pbs_mom(8B), pbs_server(8B), pbs_sched(8B), pbs_comm(8B) ================================================ FILE: doc/man1/pbs_python.1B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. 
.\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_python 1B "6 May 2020" Local "PBS Professional" .SH NAME .B pbs_python \- Python interpreter for debugging a hook script from the command line .SH SYNOPSIS .B pbs_python --hook [-e ] [-i ] .RS 11 [-L ] [-l ] [-o ] .br [-r ] [-s ] [] .RE .B pbs_python .B pbs_python --version .SH DESCRIPTION The PBS Python interpreter, .B pbs_python, is a wrapper for Python. 
You can use the .B pbs_python wrapper that is shipped with PBS to debug hooks. Either: .RS 5 Use the .I --hook option to .B pbs_python to run .B pbs_python as a wrapper to Python, employing the .B pbs_python options. With the .I --hook option, you cannot use the standard Python options. The rest of this man page covers how to use .B pbs_python with the .I --hook option. Do not use the .I --hook option, so .B pbs_python runs the Python interpreter, with the standard Python options, and without access to the .B pbs_python options. .RE .B Debugging Hooks .br You can get each hook to write out debugging files, and then modify the files and use them as debugging input to .B pbs_python. Alternatively, you can write them yourself. Debugging files can contain information about the event, about the site, and about what the hook changed. You can use these as inputs to a hook when debugging. .SH Options to pbs_python .IP "--hook" 6 This option is a switch. When you use this option, you can use the PBS Python module (via "import pbs"), and the other options described here are available. When you use this option, you cannot use the standard Python options. This option is useful for debugging. When you do not use this option, you cannot use the other options listed here, but you can use the standard Python options. .IP "-e " 6 Sets the mask that determines which event types are logged by .B pbs_python. To see only debug messages, set the value to 0xd80. To see all messages, set the value to 0xffff. .br The .B pbs_python interpreter uses the same set of mask values that are used for the .I $logevent entry in the .B pbs_mom configuration file. See the pbs_mom.8B man page. Available only when .I --hook option is used. .IP "-i " 6 Text file containing data to populate pbs.event() objects. Each line specifies an attribute value or a resource value. 
Syntax of each input line is one of the following: .RS 10 .= .br .[]= .RE .IP Where .RS 10 is a PBS object name which can refer to its sub-objects. Examples: "pbs.event()", "pbs.event().job", "pbs.event().vnode_list[""]". .RE .IP Example input file: .RS 10 .br pbs.event().hook_name=proto .br pbs.event().hook_type=site .br pbs.event().type=queuejob .br pbs.event().requestor=user1 .br pbs.event().requestor_host=host1 .br pbs.event().hook_alarm=40 .br pbs.event().job.id=72 .br pbs.event().job.Job_Name=job1 .br pbs.event().job.Resource_List[ncpus]=5 .br pbs.event().job.Resource_List[mem]=6mb .br pbs.event().vnode_list["host1"].resources_available["ncpus"] = 5 .br pbs.event().vnode_list["host1"].resources_available["mem"] = 300gb .RE .IP Available only when .I --hook option is used. .IP "-L " 6 Directory holding the log file where pbs.logmsg() and pbs.logjobmsg() write their output. Default is current working directory where .B pbs_python is executed. Available only when .I --hook option is used. .IP "-l " 6 Log file where pbs.logmsg() and pbs.logjobmsg() write their output. Default file name is current date in .I yyyymmdd format. Available only when .I --hook option is used. .IP "-o " 6 The hook execution record contains the changes made after executing the hook script, such as the attributes and resources set in any pbs.event() jobs and reservations, whether an action was accepted or rejected, and any pbs.reject() messages. .br Example hook execution record: .RS 10 .br pbs.event().job.Job_Name=job2 .br pbs.event().job.Resource_List[file]=60gb .br pbs.event().job.Resource_List[ncpus]=5 .br pbs.event().job.Resource_List[mem]=20gb .br pbs.event().job.Account_Name=account2 .br pbs.event().reject=True .br pbs.event().reject_msg=No way! .RE .IP Without this option, output goes to stdout. .IP Available only when .I --hook option is used. .IP "-r " 6 File/path name containing a resource definition specifying a custom resource whose Python type is .I pbs.resource. 
.br Format: .br .I type= [flag=] .br This file has the same format as the PBS_HOME/server_priv/resourcedef file. Available only when .I --hook option is used. .IP "-s " 6 The site data file can contain any relevant information about the server, queues, vnodes, and jobs at the server. This file can be written by a hook or by the administrator. .br When the hook writes it, this file contains the values that populate the server, queues, vnodes, reservations, and jobs, with all attributes and resources for which there are values. .br The site data file is named .I hook___.data. Available only when .I --hook option is used. .IP "--version" 6 The .B pbs_python command prints its version information and exits. This option can only be used alone. .SH ARGUMENTS .IP "" 6 The hook script to execute. We recommend importing the PBS Python module at the start of the script: .RS 9 import pbs .RE .IP If you do not specify .I Python script, you can perform interactive debugging. If you type the following: .RS 9 pbs_python --hook -i hook.input .RE .IP The interpreter displays a prompt: .RS 9 >> .RE .IP You can type your Python lines at the prompt: .RS 9 >>import pbs .br >> e=pbs.event().job .br >> print e.id .br .br ... .RE ================================================ FILE: doc/man1/pbs_queue_attributes.7B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. 
.\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_queue_attributes 7B "6 May 2020" Local "PBS Professional" .SH NAME pbs_queue_attributes \- Attributes of PBS queues .SH DESCRIPTION Queues have the following attributes: .IP acl_group_enable 8 Controls whether group access to the queue obeys the access control list defined in the .I acl_groups queue attribute. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 Group access to the queue is limited according to the group access control list. .IP False 3 All groups are allowed access. .RE .IP Default: .I False .IP acl_groups 8 List of groups which are allowed or denied access to this queue. The groups in the list are groups on the server host, not submitting hosts. 
List is evaluated left-to-right; first match in list is used. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: "[+|-][, ...]" .br Python type: .I pbs.acl .br Default: No default .IP acl_host_enable 8 Controls whether host access to the queue obeys the access control list defined in the .I acl_hosts queue attribute. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 Host access to the queue is limited according to the host access control list. .IP False 3 All hosts are allowed access. .RE .IP Default: .I False .IP acl_hosts 8 List of hosts from which jobs may be submitted to this queue. List is evaluated left-to-right; first match in list is used. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: "[+|-][, ...]" .br Python type: .I pbs.acl .br Default: No default .IP acl_user_enable 8 Controls whether user access to the queue obeys the access control list defined in the .I acl_users queue attribute. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 User access to the queue is limited according to the user access control list. .IP False 3 All users are allowed access. .RE .IP Default: .I False .IP acl_users 8 List of users which are allowed or denied access to this queue. List is evaluated left-to-right; first match in list is used. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: "[+|-][, ...]" .br Python type: .I pbs.acl .br Default: No default .IP alt_router 8 No longer used. .IP backfill_depth 8 Modifies backfilling behavior for this queue. 
Sets the number of jobs to be backfilled around in this queue. Overrides .I backfill_depth server attribute. .br Recommendation: set this to less than .I 100. .br Applies to execution queues. .br Readable by all; settable by all. .br Format: .I Integer .br Valid values: Must be >=0 .br Behavior: .RS .IP ">= 0" 3 PBS backfills around the specified number of jobs. .IP "Unset" 3 Backfill depth is set to .I 1. .RE .IP Python type: .I int .br Default: Unset (backfill depth is 1) .IP checkpoint_min 8 Minimum number of minutes of CPU time or walltime allowed between checkpoints of a job. If a user specifies a time less than this value, this value is used instead. The value given in .I checkpoint_min is used for both CPU minutes and walltime minutes. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I pbs.duration .br Default: No default .IP default_chunk 8 The list of resources which will be inserted into each chunk of a job's select specification if the corresponding resource is not specified by the user. This provides a means for a site to be sure a given resource is properly accounted for even if not specified by the user. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .nf .I default_chunk.= .I [, default_chunk.=, ...] .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 default_chunk[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP enabled 8 Specifies whether this queue accepts new jobs. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 This queue is enabled. This queue accepts new jobs; new jobs can be enqueued. .IP False 3 This queue does not accept new jobs. 
.RE .IP Default: .I False (disabled) .IP from_route_only 8 Specifies whether this queue accepts jobs only from routing queues, or from both execution and routing queues. .br Applies to routing and execution queues. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS .IP True 3 This queue accepts jobs only from routing queues. .IP False 3 This queue accepts jobs from both execution and routing queues, as well as directly from submitter. .RE .IP Default: .I False .IP hasnodes 8 Indicates whether vnodes are associated with this queue. .br Applies to execution queues. .br Readable by all; set by PBS. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS 11 When .I True, there are vnodes associated with this queue. .RE .IP Default: .I False .IP kill_delay 8 The time delay between sending SIGTERM and SIGKILL when a qdel command is issued against a running job. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Units: .I Seconds .br Python type: .I pbs.duration .br Valid values: Must be >= 0 .br Default: .I 10 seconds .IP max_array_size 8 The maximum number of subjobs that are allowed in an array job. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP max_group_res 8 Old limit attribute. Incompatible with new limit attributes. The maximum amount of the specified resource that any single group may consume in a complex. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .I max_group_res.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_group_res[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. 
"ncpus", "mem", "pmem" .br Example: .I set server max_group_res.ncpus=6 .br Default: No default .IP max_group_res_soft 8 Old limit attribute. Incompatible with new limit attributes. The soft limit on the amount of the specified resource that any single group may consume in a complex. If a group is consuming more than this amount of the specified resource, their jobs are eligible to be preempted by jobs from groups who are not over their soft limit. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .I max_group_res_soft.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_group_res_soft[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_group_res_soft.ncpus=3 .br Default: No default .IP max_group_run 8 Old limit attribute. Incompatible with new limit attributes. The maximum number of jobs owned by a group that are allowed to be running from this queue at one time. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP max_group_run_soft 8 Old limit attribute. Incompatible with new limit attributes. The maximum number of jobs owned by users in a single group that are allowed to be running from this queue at one time. If a group has more than this number of jobs running, their jobs are eligible to be preempted by jobs from groups who are not over their soft limit. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP max_queuable 8 Old limit attribute. Incompatible with new limit attributes. The maximum number of jobs allowed to reside in this queue at any given time. .br Applies to routing and execution queues. 
.br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default (no limit) .IP max_queued 8 Limit attribute. The maximum number of jobs allowed to be queued in or running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br .br Format: .I Limit specification. See .B FORMATS. .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_queued[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP max_queued_res 8 Limit attribute. The maximum amount of the specified resource allowed to be allocated to jobs queued in or running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification. See .B FORMATS. .br Syntax: .I max_queued_res.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_queued_res[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_queued_res.ncpus=4 .br Default: No default .IP max_run 8 Limit attribute. The maximum number of jobs allowed to be running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification. See .B FORMATS. .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_run[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP max_run_res 8 Limit attribute. 
The maximum amount of the specified resource allowed to be allocated to jobs running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification. See .B FORMATS. .br Syntax: .I max_run_res.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_run_res[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_run_res.ncpus=4 .br Default: No default .IP max_run_res_soft 8 Limit attribute. Soft limit on the amount of the specified resource allowed to be allocated to jobs running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification. See .B FORMATS. .br Syntax: .I max_run_res_soft.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_run_res_soft[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_run_res_soft.ncpus=2 .br Default: No default .IP max_run_soft 8 Limit attribute. Soft limit on the number of jobs allowed to be running from this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification. See .B FORMATS. .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_run_soft[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP max_running 8 Old limit attribute. Incompatible with new limit attributes. 
For an execution queue, this is the largest number of jobs allowed to be running at any given time. For a routing queue, this is the largest number of jobs allowed to be transiting from this queue at any given time. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP max_user_res 8 Old limit attribute. Incompatible with new limit attributes. The maximum amount of the specified resource that any single user may consume. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .I max_user_res.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_user_res[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_user_res.ncpus=2 .br Default: No default .IP max_user_res_soft 8 Old limit attribute. Incompatible with new limit attributes. The soft limit on the amount of the specified resource that any single user may consume. If a user is consuming more than this amount of the specified resource, their jobs are eligible to be preempted by jobs from users who are not over their soft limit. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .I max_user_res_soft.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 max_user_res_soft[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq max_user_res_soft.ncpus=2 .br Default: No default .IP max_user_run 8 Old limit attribute. Incompatible with new limit attributes. The maximum number of jobs owned by a single user that are allowed to be running from this queue at one time. .br Applies to execution queues. 
.br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP max_user_run_soft 8 Old limit attribute. Incompatible with new limit attributes. The soft limit on the number of jobs owned by any single user that are allowed to be running from this queue at one time. If a user has more than this number of jobs running, their jobs are eligible to be preempted by jobs from users who are not over their soft limit. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Python type: .I int .br Default: No default .IP node_group_key 8 Specifies the resources to use for placement sets. Overrides server's .I node_group_key attribute. Specified resources must be of type .I string_array. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I string_array .br Syntax: .RS 11 .I Comma-separated list of resource names. .br When specifying multiple resources, enclose value in double quotes. .RE .IP Python type: .I pbs.node_group_key .br Example: .RS 11 Qmgr> set queue workq node_group_key= .RE .IP Default: No default .IP partition 8 Name of partition to which this queue is assigned. Cannot be set for routing queue. An execution queue cannot be changed to a routing queue while this attribute is set. .br Applies to execution queues. .br Readable by all; settable by Manager. .br Format: .I String .br Python type: .I str .br Default: No default .IP Priority 8 The priority of this queue compared to other queues of the same type in this PBS complex. Priority can define a queue as an express queue. See .I preempt_queue_prio in the pbs_sched(8B) man page. Used for execution queues only; the value of .I Priority has no meaning for routing queues. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. 
.br Format: .I Integer .br Valid values: -1024 to 1023 .br Python type: .I int .br Default: No default .IP queued_jobs_threshold 8 Limit attribute. The maximum number of jobs allowed to be queued in this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Limit specification; See .B LIMITS .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 queued_jobs_threshold[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default: No default .IP queued_jobs_threshold_res 8 Limit attribute. The maximum amount of the specified resource allowed to be allocated to jobs queued in this queue. Can be specified for projects, users, groups, or all. Cannot be used with old limit attributes. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I limit specification. See .B LIMITS .br Syntax: .I queued_jobs_threshold_res.= .br Python type: .I pbs.pbs_resource .br Syntax: .RS 11 queued_jobs_threshold_res_[""]= .br where .I resource name is any built-in or custom resource .RE .IP Valid values: Any PBS resource, e.g. "ncpus", "mem", "pmem" .br Example: .I set queue workq queued_jobs_threshold_res.ncpus=8 .br Default: No default .IP queue_type 8 The type of the queue. This attribute must be explicitly set at queue creation. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Python type: .RS 11 PBS queue type constant: .I pbs.QUEUETYPE_EXECUTION or .I pbs.QUEUETYPE_ROUTE .RE .IP Valid values: "e", "execution", "r", "route" .br Default: No default .IP require_cred 8 Specifies the credential type required. All jobs submitted to the named queue without the specified credential will be rejected. .br Applies to routing and execution queues. 
.br Readable by all; settable by Manager. .br Format: .I String .br Python type: .I str .br Valid values: .I krb5 or .I dce .br Default: Unset .IP require_cred_enable 8 Specifies whether the credential authentication method specified in the .I require_cred queue attribute is required for this queue. .br Applies to routing and execution queues. .br Readable by all; settable by Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS 11 When set to .I True, the credential authentication method is required. .RE .IP Default: .I False .IP resources_assigned 8 The total for each kind of resource allocated to running and exiting jobs in this queue. .br Applies to execution queues. .br Readable by all; set by PBS. .br Format: .I String .br Syntax: .RS 11 .nf .I resources_assigned.= .I resources_assigned.= ... .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_assigned[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default value: No default .IP resources_available 8 The list of resources and amounts available to jobs running in this queue. The sum of the resource of each type used by all jobs running from this queue cannot exceed the total amount listed here. See the .I qmgr(1B) man page. .br Applies to execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .nf .I resources_available.= .I resources_available.= ... .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_available[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default value: No default .IP resources_default 8 The list of default resource values which are set as limits for a job residing in this queue and for which the job did not specify a limit. 
If not explicitly set, the default limit for a job is determined by the first of the following attributes which is set: server's .I resources_default, queue's .I resources_max, server's .I resources_max. If none of these is set, the job gets unlimited resource usage. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .nf .I resources_default.=, .I resources_default.=, ... .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_default[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default value: No default .IP resources_max 8 The maximum amount of each resource that can be requested by a single job in this queue. The queue value supersedes any server wide maximum limit. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .nf .I resources_max.=, .I resources_max.=, ... .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_max[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default value: No default (infinite usage) .IP resources_min 8 The minimum amount of each resource that can be requested by a single job in this queue. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. .br Format: .I String .br Syntax: .RS 11 .nf .I resources_min.=, .I resources_min.=, ... .fi .RE .IP Python type: .I pbs.pbs_resource .br Syntax: .RS 11 resources_min[""]= .br where .I resource name is any built-in or custom resource .RE .IP Default value: No default (zero usage) .IP route_destinations 8 The list of destinations to which jobs may be routed. .br Must be set to at least one valid destination. .br Applies to routing queues. .br Readable by all; settable by Manager. 
.br Format: .I String .br Syntax: .RS 11 List of comma-separated strings: .br .I [@[:]] .RE .IP Python type: .I pbs.route_destinations .br Example: .I Q1,Q2@remote,Q3@remote:15501 .br Default: No default .IP route_held_jobs 8 Specifies whether jobs in the .I held state can be routed from this queue. .br Applies to routing queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool .br Behavior: .RS 11 When .I True, jobs with a hold can be routed from this queue. .RE .IP Default: .I False .IP route_lifetime 8 The maximum time a job is allowed to reside in this routing queue. If a job cannot be routed in this amount of time, the job is aborted. .br Applies to routing queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Units: .I Seconds .br Python type: .I pbs.duration .br Behavior: .RS .IP >0 3 Jobs can reside for specified number of seconds .IP "0 or unset" 3 Jobs can reside for infinite time .RE .IP Default: Unset .IP route_retry_time 8 Time delay between routing retries. Typically used when the network between servers is down. .br Applies to routing queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Integer .br Units: .I Seconds .br Python type: .I pbs.duration .br Default: .I 30 seconds .IP route_waiting_jobs 8 Specifies whether jobs whose .I Execution_Time attribute value is in the future can be routed from this queue. .br Applies to routing queues. .br Readable by all; settable by Operator and Manager. .br Format: .I Boolean .br Python type: .I bool Behavior: .RS 11 When .I True, jobs with a future .I Execution_Time can be routed from this queue. .RE .IP Default: .I False .IP started 8 If this is an execution queue, specifies whether jobs in this queue can be scheduled for execution, or if this is a routing queue, whether jobs can be routed. .br Applies to routing and execution queues. .br Readable by all; settable by Operator and Manager. 
.br Format: .I Boolean .br Python type: .I bool .br Behavior: When .I True, jobs in this queue can run or be routed. .br Default: .I False .IP state_count 8 The total number of jobs in each state currently residing in this queue. .br Applies to routing and execution queues. .br Readable by all; set by PBS. .br Format: .I String .br Syntax: .I transiting=,exiting=, ... .br Python type: .I pbs.state_count .br Default: No default .IP total_jobs 8 The number of jobs currently residing in this queue. .br Applies to routing and execution queues. .br Readable by all; set by PBS. .br Format: .I Integer .br Python type: .I int .br Default: No default .SH FORMATS .IP "Limit specification" 8 Limit attributes can be set, added to, or removed from. Format for setting a limit specification: .RS 11 .nf set server = "=[, =] ..." .fi .RE .IP Format for adding to a limit specification: .RS 11 .nf set server += "=[, =] ..." .fi .RE .IP Format for removing from a limit specification: .RS 11 .nf set server -= "=[, [=] ..." .br or .br set server -= "[, ] ..." .fi .RE .IP Where .I limit specification is .RS 11 o:PBS_ALL Overall limit .br u:PBS_GENERIC Generic users .br u: A specific user .br g:PBS_GENERIC Generic groups .br g: A specific group .br p:PBS_GENERIC Generic projects .br p: A specific project .RE .IP The .I limit specification can contain spaces anywhere except after the colon (":"). .br If there are comma-separated .I limit specifications, the entire string must be enclosed in double quotes. .br A username, groupname, or project name containing spaces must be enclosed in quotes. .br If a username, groupname, or project name is quoted using double quotes, and the entire string requires quotes, the outer enclosing quotes must be single quotes. Similarly, if the inner quotes are single quotes, the outer quotes must be double quotes. .br .I PBS_ALL is a keyword which indicates that this limit applies to the usage total. 
.br .I PBS_GENERIC is a keyword which indicates that this limit applies to generic users, groups, or projects. .br When removing a limit, the .I limit value does not need to be specified. .br For example, to set the .I max_queued limit on QueueA to 5 for total usage, and to limit user bill to 3: .RS 11 s q QueueA max_queued = "[o:PBS_ALL=5], [u:bill =3]" .RE .IP Examples of setting, adding, and removing: .br .RS 11 set server max_run="[u:PBS_GENERIC=2], [g:group1=10], [o:PBS_ALL = 100]" .br set server max_run+="[u:user1=3], [g:PBS_GENERIC=8]" .br set server max_run-="[u:user2], [g:group3]" .br set server max_run_res.ncpus="[u:PBS_GENERIC=2], [g:group1=8], [o:PBS_ALL = 64]" .RE .IP .SH Incompatible Limit Attributes The old and new limit attributes are incompatible. If any of one kind is set, none of the other kind can be set. All of one kind must be unset in order to set any of the other kind. .br .SH SEE ALSO qmgr(1B) ================================================ FILE: doc/man1/pbs_ralter.1B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . 
.\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_ralter 1B "28 February 2021" Local "PBS Professional" .SH NAME .B pbs_ralter \- modify an existing reservation .SH SYNOPSIS .B pbs_ralter [-D ] [-E ] [-G ] [-I ] [-l select=" 10 (Lowercase L) Specifies new select specification for reservation. New specification must be a subset of the same chunks requested by the original reservation. If reservation is started, cannot be used to release chunks where reservation jobs are running. If reservation is started and degraded, you must release all unavailable chunks in order to alter the reservation select specification. .IP "-m " 10 Specifies the set of events that cause mail to be sent to the list of users specified in the .I -M option. Format: .I String .br Syntax: Either of .RS 13 1) any combination of "a", "b", "c" or "e", or .br 2) the single character "n" .RE .IP .nf Suboptions to -m Option: Character Meaning -------------------------------------------------------------- a Notify if reservation is terminated for any reason b Notify when the reservation period begins c Notify when the reservation is confirmed e Notify when the reservation period ends n Send no mail. Cannot be used with any of a, b, c or e. 
.fi Default: No default; if not specified, mail events are unchanged .IP "-M " 10 The list of users to whom mail is sent whenever the reservation transitions to one of the states specified in the .I -m option. Format: .I [@][,[@]...] Default: No default; if not specified, user list is unchanged .IP "-N " 10 Specifies a name for the reservation. Format: .RS 13 String up to 15 characters in length. It must consist of printable, non-white space characters with the first character alphabetic. .RE .IP Default: No default; if not specified, reservation name is unchanged .IP "-R " 10 Specifies reservation's new start time. This option can be used either when the reservation is not running or there are no jobs are submitted to the reservation. You cannot use this option when a reservation is not empty and has started running. The specifications for providing the time are the same as for pbs_rsub: .br If the day, .I DD, is not specified, it defaults to today if the time .I hhmm is in the future. Otherwise, the day is set to tomorrow. For example, if you alter a reservation with the specification -R 1110 at 11:15 a.m., it is interpreted as being for 11:10 a.m. tomorrow. If the month portion, .I MM, is not specified, it defaults to the current month, provided that the specified day .I DD, is in the future. Otherwise, the month is set to next month. Similar rules apply to the two other optional, left-side components. Format: .I Datetime .IP "-U " 10 Comma-separated list of users who are and are not allowed to submit jobs to this reservation. Sets reservation's .I Authorized_Users attribute to .I auth user list. .br This list becomes the .I acl_users attribute for the reservation's queue. .br More specific entries should be listed before more general, because the list is read left-to-right, and the first match determines access. The reservation creator's username is automatically added to this list, whether or not the reservation creator specifies this list. 
.br If both the .I Authorized_Users and .I Authorized_Groups reservation attributes are set, a user must belong to both in order to be able to submit jobs to this reservation. .br See the .I Authorized_Users reservation attribute in the pbs_resv_attributes(7B) man page. .br Syntax: .I [+|-][@][,[+|-][@]...] .br Default: no default; user list is unchanged .br .IP "-Wforce" 10 Enforces changes made to the reservation start time, end time, or duration, regardless of the actions of the scheduler. Can be used only by the PBS Administrator. Note that with this option you can force PBS to oversubscribe resources, in which case you (the administrator) may need to manage them yourself. Cannot be used to change the start time of a reservation in which jobs are running. .IP "--version" 10 The .B pbs_ralter command returns its PBS version information and exits. This option can only be used alone. .SH OPERANDS The pbs_ralter command takes a reservation ID. .br For an advance or job-specific reservation this has the form: .RS 4 .I "R[.][@]" .RE For a standing reservation this has the form: .RS 4 .I "S[.][@]" .RE For a maintenance reservation this has the form: .RS 4 .I "M[.][@]" .RE .I @ specifies a reservation at a server other than the default server. ================================================ FILE: doc/man1/pbs_rdel.1B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. 
.\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. .\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_rdel 1B "6 May 2020" Local "PBS Professional" .SH NAME .B pbs_rdel \- delete a PBS reservation .SH SYNOPSIS .B pbs_rdel [,...] .br .B pbs_rdel --version .SH DESCRIPTION The .B pbs_rdel command deletes reservations in the order specified. This command deletes the specified reservations, whether or not they are running, all jobs in the reservations, and the reservation queues. .B Required Privilege .br A reservation may be deleted by its owner, a PBS Operator, or a PBS Manager. .SH OPTIONS .IP "--version" 10 The .B pbs_rdel command returns its PBS version information and exits. This option can only be used alone. .SH OPERANDS The pbs_rdel command accepts one or more .I reservation ID operands. 
.br For an advance or job-specific reservation this has the form: .RS 4 .I "R[.][@]" .RE For a standing reservation this has the form: .RS 4 .I "S[.][@]" .RE For a maintenance reservation this has the form: .RS 4 .I "M[.][@]" .RE .I @ specifies a reservation at a server other than the default server. .SH EXIT STATUS .IP "Zero" 10 Upon success .IP "Greater than zero" 10 Upon failure to process any operand .SH SEE ALSO pbs_rsub(1B), pbs_rstat(1B), pbs_resv_attributes(7B) ================================================ FILE: doc/man1/pbs_release_nodes.1B ================================================ .\" .\" Copyright (C) 1994-2021 Altair Engineering, Inc. .\" For more information, contact Altair at www.altair.com. .\" .\" This file is part of both the OpenPBS software ("OpenPBS") .\" and the PBS Professional ("PBS Pro") software. .\" .\" Open Source License Information: .\" .\" OpenPBS is free software. You can redistribute it and/or modify it under .\" the terms of the GNU Affero General Public License as published by the .\" Free Software Foundation, either version 3 of the License, or (at your .\" option) any later version. .\" .\" OpenPBS is distributed in the hope that it will be useful, but WITHOUT .\" ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or .\" FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public .\" License for more details. .\" .\" You should have received a copy of the GNU Affero General Public License .\" along with this program. If not, see . .\" .\" Commercial License Information: .\" .\" PBS Pro is commercially licensed software that shares a common core with .\" the OpenPBS software. For a copy of the commercial license terms and .\" conditions, go to: (http://www.pbspro.com/agreement.html) or contact the .\" Altair Legal Department. 
.\" .\" Altair's dual-license business model allows companies, individuals, and .\" organizations to create proprietary derivative works of OpenPBS and .\" distribute them - whether embedded or bundled with other software - .\" under a commercial license agreement. .\" .\" Use of Altair's trademarks, including but not limited to "PBS™", .\" "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is .\" subject to Altair's trademark licensing policies. .\" .TH pbs_release_nodes 1B "6 May 2020" Local "PBS Professional" .SH NAME .B pbs_release_nodes \- release vnodes assigned to a PBS job .SH SYNOPSIS .B pbs_release_nodes [-j ] .RS 18 .br [-k ( | .br )] .br [ [] ...] .RE .br .B pbs_release_nodes [-j ] -a .br .B pbs_release_nodes --version .SH DESCRIPTION You can use the .B pbs_release_nodes command to release no-longer-needed sister hosts or vnodes assigned to a running job, before the job would normally release them. These vnodes are then available for use by other jobs. You can specify the names of sister vnodes to be released, or you can release all sister vnodes not on the primary execution host that are assigned to a running job via the .I -a option. PBS can keep the number of sister hosts you specify, or PBS can release all sister vnodes except for the ones you specify via a select statement. Can be used on jobs and subjobs, but not on job arrays or ranges of subjobs. .B Caveats and Restrictions .br You can release only sister hosts or vnodes that are not on the primary execution host. You cannot release vnodes on the primary execution host. The job must be running (in the .I R state). The pbs_release_nodes command is not supported on vnodes tied to Cray X* series systems (vnodes whose .I vntype has the "cray_" prefix). If cgroups support is enabled, and pbs_release_nodes is called to release some but not all the vnodes managed by a MoM, resources on those vnodes that are part of a cgroup are not released until the entire cgroup is released.
You cannot release a partial host. If you try to release some but not all of a host, the job's .I exec_vnode attribute shows the new, smaller list of vnodes, but the pbsnodes command will reveal that the host is still allocated to the job. If you specify release of a vnode on which a job process is running, that process is terminated when the vnode is released. .B Required Privilege .br This command can be run by the job owner, the PBS Manager, Operator, and Administrator, as well as root on Linux and Admin on Windows. .SH Options to pbs_release_nodes .IP "-a" 10 Releases all job vnodes not on the primary execution host. Cannot be used .I -k option, or with list of vnode names. .IP "-j " 10 Specifies the job ID for the job or subjob whose vnode(s) are to be released. .IP "-k | " 10 Use .I keep number to specify how many sister hosts to keep. Use .I keep selection to specify which sister vnodes to keep. The .I keep selection is a select statement beginning with "select=" specifying which vnodes to keep. The primary execution host and its vnodes are not released. For example, to release all sister hosts except 8: .br .B \ \ \ pbs_release_nodes -k 8 .br To release all sister vnodes except for 4 of the ones marked with "bigmem": .br .B \ \ \ pbs_release_nodes -k select=4:bigmem=true Cannot be used with .I -a option or with vnode list argument. .IP "(no options)" 10 With no options, pbs_release_nodes uses the value of the .I PBS_JOBID environment variable as the job ID of the job whose vnodes are to be released. .IP "--version" 10 The pbs_release_nodes command returns its PBS version information and exits. This option can only be used alone. .SH Operands for pbs_release_nodes The pbs_release_nodes command can take as an operand a list of vnodes. Format: .br .I [ [] ...] .br Cannot be used with the .I -a option. .SH Usage This command can be run at the command line, or called inside a job script, where it can use the value of the .I PBS_JOBID environment variable. 
You can release any vnode that appears in the job's .I exec_vnode attribute that is not on the primary execution host. You can release a particular set of a job's vnodes, or you can release all of a job's non-primary-execution-host vnodes. To release specific vnodes: .br .B \ \ \ pbs_release_nodes [-j ] [] ...] To release all of a job's vnodes that are not on the primary execution host: .br .B \ \ \ pbs_release_nodes [-j ] -a To release all except a specified number of vnodes: .br .B \ \ \ pbs_release_nodes -k To release all vnodes except for those in a select specification: .br .B \ \ \ pbs_release_nodes -k %s' __s += [_s % ('all', 1, 'Show All')] __s += [_s % ('pass', 2, 'Show only "Passed"')] __s += [_s % ('skip', 3, 'Show only "Skipped"')] __s += [_s % ('fail', 4, 'Show only "Failed"')] __s += [_s % ('error', 5, 'Show only "Error"')] __s += [_s % ('timedout', 6, 'Show only "TimedOut"')] __s += [''] self.__dbobj[_TESTRESULT_TN].write('\n'.join(__s)) self.__dbobj[_TESTRESULT_TN].flush() def __write_test_data(self, data): if _TESTRESULT_TN not in self.__dbobj.keys(): self.__dbobj[_TESTRESULT_TN] = open(self.dbpath, 'w+') self.__write_test_html_header(data) d = {} d['suite'] = data['suite'] d['testcase'] = data['testcase'] d['status'] = data['status'] d['status_data'] = data['status_data'] d['duration'] = str(data['duration']) self.__dbobj[_TESTRESULT_TN].seek(0, os.SEEK_END) self.__dbobj[_TESTRESULT_TN].seek( self.__dbobj[_TESTRESULT_TN].tell() - 27, os.SEEK_SET) t = self.__dbobj[_TESTRESULT_TN].readline().strip() line = '' if t != '[': line += ',\n' else: line += '\n' line += str(d) + '\n];' self.__dbobj[_TESTRESULT_TN].seek(0, os.SEEK_END) self.__dbobj[_TESTRESULT_TN].seek( self.__dbobj[_TESTRESULT_TN].tell() - 26, os.SEEK_SET) self.__dbobj[_TESTRESULT_TN].write(line) self.__dbobj[_TESTRESULT_TN].flush() self.__index += 1 def write(self, data, logfile=None): if len(data) == 0: return if 'testdata' in data.keys(): self.__write_test_data(data['testdata']) def 
def close(self, result=None):
    """Flush, terminate, and close every open HTML result file."""
    # NOTE(review): this is the body of HTMLDb.close — the enclosing
    # class header lies outside this extract.
    for v in self.__dbobj.values():
        v.write('\n')
        v.flush()
        v.close()


class JSONDb(DBType):
    """
    JSON type database
    """

    def __init__(self, dbtype, dbpath, dbaccess):
        super(JSONDb, self).__init__(dbtype, dbpath, dbaccess)
        if self.dbtype != 'json':
            _msg = 'db type does not match with my type(json)'
            raise PTLDbError(rc=1, rv=False, msg=_msg)
        if not self.dbpath:
            _msg = 'Db path require!'
            raise PTLDbError(rc=1, rv=False, msg=_msg)
        elif not self.dbpath.endswith('.json'):
            # BUG FIX: the original used self.dbpath.rstrip('.db'), but
            # str.rstrip strips any trailing run of the *characters*
            # '.', 'd', 'b' (e.g. "results_bd" -> "results_"), not the
            # literal ".db" suffix.  Remove the exact suffix instead.
            if self.dbpath.endswith('.db'):
                self.dbpath = self.dbpath[:-len('.db')]
            self.dbpath += '.json'
        self.jdata = {}
        # Record the exact command line that produced this result set;
        # it is embedded in the JSON document by PTLJsonData.
        self.__cmd = [os.path.basename(sys.argv[0])]
        self.__cmd += sys.argv[1:]
        self.__cmd = ' '.join(self.__cmd)
        self.res_data = PTLJsonData(command=self.__cmd)

    def __write_test_data(self, data):
        # Merge the new test record into the accumulated document and
        # rewrite the whole file so it is valid JSON after every test.
        prev_data = copy.deepcopy(self.jdata)
        self.jdata = self.res_data.get_json(data=data, prev_data=prev_data)
        with open(self.dbpath, 'w') as fd:
            json.dump(self.jdata, fd, indent=2)
            fd.write("\n")

    def write(self, data, logfile=None):
        """Record one test result; empty payloads are ignored."""
        if len(data) == 0:
            return
        if 'testdata' in data.keys():
            self.__write_test_data(data['testdata'])

    def close(self, result=None):
        """Stamp overall run times into the document and do a final write."""
        if result is not None and self.jdata:
            dur = str(result.stop - result.start)
            self.jdata['result']['start'] = str(result.start)
            self.jdata['result']["end"] = str(result.stop)
            self.jdata['result']['duration'] = dur
            with open(self.dbpath, 'w') as fd:
                json.dump(self.jdata, fd, indent=2)
                fd.write("\n")


class PTLTestDb(Plugin):
    """
    PTL Test Database Plugin
    """
    name = 'PTLTestDb'
    score = sys.maxsize - 5
    logger = logging.getLogger(__name__)

    def __init__(self):
        Plugin.__init__(self)
        self.__dbconn = None
        self.__dbtype = None
        self.__dbpath = None
        self.__dbaccess = None
        # Map of user-selectable backend names to their DBType classes.
        self.__dbmapping = {'file': FileDb,
                            'html': HTMLDb,
                            'json': JSONDb,
                            'sqlite': SQLiteDb,
                            'pgsql': PostgreSQLDb}
        self.__du = DshUtils()

    def options(self, parser, env):
        """
        Register command line options
        """
        pass

    def set_data(self, dbtype, dbpath, dbaccess):
        """
        Set the data
        """
        self.__dbtype = dbtype
        self.__dbpath = dbpath
self.__dbaccess = dbaccess

# NOTE(review): the defs below are methods of PTLTestDb (its class
# statement appears earlier in the file).

def configure(self, options, config):
    """
    Configure the plugin and system, based on selected options

    :param options: Configuration options for ``plugin`` and ``system``
    """
    # Idempotent: a live connection means we are already configured.
    if self.__dbconn is not None:
        return
    if self.__dbtype is None:
        self.__dbtype = 'json'
    if self.__dbtype not in self.__dbmapping.keys():
        self.logger.error('Invalid db type: %s' % self.__dbtype)
        sys.exit(1)
    try:
        self.__dbconn = self.__dbmapping[self.__dbtype](self.__dbtype,
                                                        self.__dbpath,
                                                        self.__dbaccess)
    except PTLDbError as e:
        self.logger.error(str(e) + '\n')
        sys.exit(1)
    self.enabled = True

def __create_data(self, test, err=None, status=None):
    """
    Build the per-test result dictionary written to the backend.

    :param test: nose test (or context) wrapper object
    :param err: sys.exc_info()-style tuple for failures/errors, or None
    :param status: result label such as 'PASS', 'FAIL', 'ERROR'
    :returns: dict with 'testdata' (and optionally 'metrics_data') keys,
              or {} when the wrapper carries no recognizable test
    """
    if hasattr(test, 'test'):
        _test = test.test
        sn = _test.__class__.__name__
    elif hasattr(test, 'context'):
        test = _test = test.context
        sn = test.__name__
    else:
        return {}
    testdata = {}
    data = {}
    cur_time = datetime.datetime.now()
    if (hasattr(_test, 'server') and
            (getattr(_test, 'server', None) is not None)):
        testdata['pbs_version'] = _test.server.attributes['pbs_version']
        testdata['hostname'] = _test.server.hostname
    else:
        testdata['pbs_version'] = 'unknown'
        testdata['hostname'] = 'unknown'
    testdata['machinfo'] = self.__get_machine_info(_test)
    testdata['testparam'] = getattr(_test, 'param', None)
    testdata['suite'] = sn
    testdata['suitedoc'] = str(_test.__class__.__doc__)
    testdata['file'] = _test.__module__.replace('.', '/') + '.py'
    testdata['module'] = _test.__module__
    testdata['testcase'] = getattr(_test, '_testMethodName', '')
    testdata['testdoc'] = getattr(_test, '_testMethodDoc', '')
    testdata['start_time'] = getattr(test, 'start_time', cur_time)
    testdata['end_time'] = getattr(test, 'end_time', cur_time)
    testdata['duration'] = getattr(test, 'duration', 0)
    testdata['tags'] = getattr(_test, TAGKEY, [])
    testdata['requirements'] = getattr(_test, 'requirements',
                                       default_requirements)
    measurements_dic = getattr(_test, 'measurements', {})
    if measurements_dic:
        testdata['measurements'] = measurements_dic
    additional_data_dic = getattr(_test, 'additional_data', {})
    if additional_data_dic:
        testdata['additional_data'] = additional_data_dic
    if err is not None:
        if isclass(err[0]) and issubclass(err[0], SkipTest):
            testdata['status'] = 'SKIP'
            testdata['status_data'] = 'Reason = %s' % (err[1])
        else:
            # A timeout is reported as an error by the runner; relabel it.
            if isclass(err[0]) and issubclass(err[0], TimeOut):
                status = 'TIMEDOUT'
            testdata['status'] = status
            testdata['status_data'] = getattr(test, 'err_in_string', '')
    else:
        testdata['status'] = status
        testdata['status_data'] = ''
    data['testdata'] = testdata
    md = getattr(_test, 'metrics_data', {})
    if len(md) > 0:
        data['metrics_data'] = md
    return data

def __get_machine_info(self, test):
    """
    Helper function to return machines dictionary with details

    :param: test
    :test type: object

    returns dictionary with machines information
    """
    mpinfo = {
        'servers': [],
        'moms': [],
        'comms': [],
        'clients': []
    }
    minstall_type = {
        'servers': 'server',
        'moms': 'execution',
        'comms': 'communication',
        'clients': 'client'
    }
    for name in mpinfo:
        mlist = None
        if (hasattr(test, name) and
                (getattr(test, name, None) is not None)):
            mlist = getattr(test, name).values()
        if mlist:
            for mc in mlist:
                mpinfo[name].append(mc)
    machines = {}
    for k, v in mpinfo.items():
        for _v in v:
            hst = _v.hostname
            if hst not in machines:
                machines[hst] = {}
                mshort = machines[hst]
                mshort['platform'] = _v.get_uname(hostname=hst)
                mshort['os_info'] = _v.get_os_info(hostname=hst)
            machines[hst]['pbs_install_type'] = minstall_type[k]
            # A MoM or comm co-located with a server host is a server.
            if ((k == 'moms' or k == 'comms') and
                    hst in mpinfo['servers']):
                machines[hst]['pbs_install_type'] = 'server'
    return machines

def addError(self, test, err):
    self.__dbconn.write(self.__create_data(test, err, 'ERROR'))

def addFailure(self, test, err):
    self.__dbconn.write(self.__create_data(test, err, 'FAIL'))

def addSuccess(self, test):
    self.__dbconn.write(self.__create_data(test, None, 'PASS'))

def finalize(self, result):
    self.__dbconn.close(result)
    self.__dbconn = None
    self.__dbaccess = None

def process_output(self, info=None, dbout=None, dbtype=None,
                   dbaccess=None, name=None, logtype=None, summary=False):
    """
    Send analyzed log information to either the screen or to a database
    file.

    :param info: A dictionary of log analysis metrics.
    :type info: Dictionary
    :param dbout: The name of the database file to send output to
    :type dbout: str or None
    :param dbtype: Type of database
    :param dbaccess: Path to a file that defines db options
                     (PostgreSQL only)
    :param name: The name of the log file being analyzed
    :type name: str or None
    :param logtype: The log type, one of ``accounting``, ``schedsummary``,
                    ``scheduler``, ``server``, or ``mom``
    :param summary: If True output summary only
    """
    # BUG FIX: the original declared ``info={}``.  A mutable default is
    # shared across calls, and this method both stores ``info`` and
    # mutates it (``del info['matches']`` below), so state could leak
    # between invocations.  Use the None-sentinel idiom instead.
    if info is None:
        info = {}
    if dbout is not None:
        try:
            self.set_data(dbtype, dbout, dbaccess)
            self.configure(None, None)
            data = {'metrics_data': {logtype: info}}
            self.__dbconn.write(data, os.path.basename(name))
            self.finalize(None)
        except Exception as e:
            sys.stderr.write(str(traceback.print_exc()))
            sys.stderr.write('Error processing output ' + str(e))
        return
    if lu.CFC in info:
        freq_info = info[lu.CFC]
    elif 'summary' in info and lu.CFC in info['summary']:
        freq_info = info['summary'][lu.CFC]
    else:
        freq_info = None
    if 'matches' in info:
        for m in info['matches']:
            print(m, end=' ')
        del info['matches']
    if freq_info is not None:
        # Print each (start, end) -> count bucket; the end timestamp is
        # shortened to time-of-day when it falls on the same date.
        for ((l, m), n) in freq_info:
            b = time.strftime("%m/%d/%y %H:%M:%S", time.localtime(l))
            e = time.strftime("%m/%d/%y %H:%M:%S", time.localtime(m))
            print(b + ' -', end=' ')
            if b[:8] != e[:8]:
                print(e, end=' ')
            else:
                print(e[9:], end=' ')
            print(': ' + str(n))
        return
    if lu.EST in info:
        einfo = info[lu.EST]
        m = []
        for j in einfo[lu.EJ]:
            m.append('Job ' + j[lu.JID] + '\n\testimated:')
            if lu.Eat in j:
                for estimate in j[lu.Eat]:
                    m.append('\t\t' + str(time.ctime(estimate)))
            if lu.JST in j:
                m.append('\tstarted:\n')
                m.append('\t\t' + str(time.ctime(j[lu.JST])))
                m.append('\testimate range: ' + str(j[lu.ESTR]))
                m.append('\tstart to estimated: ' + str(j[lu.ESTA]))
            if lu.NEST in j:
                m.append('\tnumber of estimates: ' + str(j[lu.NEST]))
            if lu.NJD in j:
                m.append('\tnumber of drifts: ' + str(j[lu.NJD]))
            if lu.JDD in j:
                m.append('\tdrift duration: ' + str(j[lu.JDD]))
            m.append('\n')
        if lu.ESTS in einfo:
            m.append('\nsummary: ')
            for k, v in sorted(einfo[lu.ESTS].items()):
                if 'duration' in k:
                    m.append('\t' + k + ': ' +
                             str(PbsTypeDuration(int(v))))
                else:
                    m.append('\t' + k + ': ' + str(v))
        print("\n".join(m))
        return
    sorted_info = sorted(info.items())
    for (k, v) in sorted_info:
        if summary and k != 'summary':
            continue
        print(str(k) + ": ", end=' ')
        if isinstance(v, dict):
            sorted_v = sorted(v.items())
            for (k, val) in sorted_v:
                print(str(k) + '=' + str(val) + ' ')
            print()
        else:
            print(str(v))
    print('')

# ================================================
# FILE: test/fw/ptl/utils/plugins/ptl_test_info.py
# ================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. import sys import logging import unittest from nose.plugins.base import Plugin from ptl.utils.pbs_testsuite import PBSTestSuite from ptl.utils.plugins.ptl_test_tags import TAGKEY from ptl.utils.pbs_testsuite import REQUIREMENTS_KEY from ptl.utils.pbs_testsuite import default_requirements from copy import deepcopy log = logging.getLogger('nose.plugins.PTLTestInfo') def get_effective_reqs(ts_reqs=None, tc_reqs=None): """ get effective requirements at test case """ tc_effective_reqs = {} if (tc_reqs is None and ts_reqs is None): tc_effective_reqs = deepcopy(default_requirements) else: tc_effective_reqs = deepcopy(default_requirements) tc_effective_reqs.update(ts_reqs) tc_effective_reqs.update(tc_reqs) return tc_effective_reqs class FakeRunner(object): def __init__(self, config): self.config = config def run(self, test): self.config.plugins.finalize(None) sys.exit(0) class PTLTestInfo(Plugin): """ Load test cases from given parameter """ name = 'PTLTestInfo' score = sys.maxsize - 2 logger = logging.getLogger(__name__) def __init__(self): self.list_test = None self.showinfo = None self.verbose = None self.gen_ts_tree = None self.suites = [] self._tree = {} self.total_suite = 0 self.total_case = 0 self.__ts_tree = {} self.__tags_tree = {'NoTags': {}} def options(self, parser, env): """ Register command line options """ pass def set_data(self, suites, list_test, showinfo, verbose, gen_ts_tree): """ Set the data required for running the tests :param suites: Test suites to run :param list_test: List of test to run :param gen_ts_tree: 
        Generate test suite tree
        """
        self.suites = suites.split(',')
        self.list_test = list_test
        self.showinfo = showinfo
        self.verbose = verbose
        self.gen_ts_tree = gen_ts_tree

    def configure(self, options, config):
        """
        Configure the plugin and system, based on selected options

        :param options: Options to configure plugin and system
        """
        self.config = config
        self.enabled = True

    def prepareTestRunner(self, runner):
        # Substitute the real runner with FakeRunner so information
        # queries only finalize plugins and exit.
        return FakeRunner(config=self.config)

    def wantClass(self, cls):
        """
        Is the class wanted?
        """
        if not issubclass(cls, unittest.TestCase) or cls is PBSTestSuite \
                or cls is unittest.TestCase:
            return False
        # Record the class (keyed by name) and walk up the first base so
        # parent suites also land in the tree.
        self._tree.setdefault(cls.__name__, cls)
        if len(cls.__bases__) > 0:
            self.wantClass(cls.__bases__[0])

    def _get_hierarchy(self, cls, level=0):
        # Depth-first render of cls and its subclasses, one extra space
        # of indent per level.
        delim = ' ' * level
        msg = [delim + cls.__name__]
        try:
            subclses = cls.__subclasses__()
        except TypeError:
            pass
        else:
            for subcls in subclses:
                msg.extend(self._get_hierarchy(subcls, level + 1))
        return msg

    def _print_suite_info(self, suite):
        # Write a human-readable summary of one suite (file, module,
        # tags, docstrings, test cases) to stdout.
        w = sys.stdout
        self.total_suite += 1
        if self.list_test:
            w.write('\n\n')
        w.write('Test Suite: %s\n\n' % suite.__name__)
        w.write(' file: %s.py\n\n' % suite.__module__.replace('.', '/'))
        w.write(' module: %s\n\n' % suite.__module__)
        tags = getattr(suite, TAGKEY, None)
        if tags is not None:
            w.write(' Tags: %s\n\n' % (', '.join(tags)))
        w.write(' Suite Doc: \n')
        for l in str(suite.__doc__).split('\n'):
            w.write(' %s\n' % l)
        dcl = suite.__dict__
        cases = []
        for k in dcl.keys():
            if k.startswith('test_'):
                # Rebinds k from attribute name to the attribute itself.
                k = getattr(suite, k)
                try:
                    k.__name__
                except BaseException:
                    # not a test case, ignore
                    continue
                self.total_case += 1
                cases.append('\t%s\n' % (k.__name__))
                if self.verbose:
                    tags = getattr(k, TAGKEY, None)
                    if tags is not None:
                        cases.append('\n\t Tags: %s\n\n' % (', '.join(tags)))
                    doc = k.__doc__
                    if doc is not None:
                        cases.append('\t Test Case Doc: \n')
                        for l in str(doc).split('\n'):
                            cases.append('\t%s\n' % (l))
        if len(cases) > 0:
            w.write(' Test Cases: \n')
            w.writelines(cases)
        if self.list_test or self.showinfo:
            lines = self._get_hierarchy(suite, 1)[1:]
            if len(lines) > 0:
                w.write('\n Test suite hierarchy:\n')
                for l in lines:
                    w.write(l + '\n')

    def _gen_ts_tree(self, suite):
        # Accumulate this suite's metadata into the suite tree
        # (self.__ts_tree) and the per-tag tree (self.__tags_tree).
        n = suite.__name__
        tsd = {}
        tsd['doc'] = str(suite.__doc__)
        tstags = getattr(suite, TAGKEY, [])
        numnodes = 1
        for tag in tstags:
            if 'numnodes' in tag:
                numnodes = tag.split('=')[1].strip()
                break
        tsd['tags'] = tstags if len(tstags) > 0 else "None"
        tsd['numnodes'] = str(numnodes)
        tsd['file'] = suite.__module__.replace('.', '/') + '.py'
        tsd['module'] = suite.__module__
        dcl = suite.__dict__
        tcs = {}
        ts_req = getattr(suite, REQUIREMENTS_KEY, {})
        for k in dcl.keys():
            if k.startswith('test_'):
                tcd = {}
                tc = getattr(suite, k)
                try:
                    tc.__name__
                except BaseException:
                    # not a test case, ignore
                    continue
                tcd['doc'] = str(tc.__doc__)
                tc_req = getattr(tc, REQUIREMENTS_KEY, {})
                tcd['requirements'] = get_effective_reqs(ts_req, tc_req)
                numnodes = 1
                # Case tags are the union of suite tags and case tags.
                tctags = sorted(set(tstags + getattr(tc, TAGKEY, [])))
                for tag in tctags:
                    if 'numnodes' in tag:
                        numnodes = tag.split('=')[1].strip()
                        break
                tcd['tags'] = tctags if len(tctags) > 0 else "None"
                tcd['numnodes'] = str(numnodes)
                tcs[k] = deepcopy(tcd)
                if len(tctags) > 0:
                    for tag in tctags:
                        if tag not in self.__tags_tree.keys():
                            self.__tags_tree[tag] = {}
                        if n not in self.__tags_tree[tag].keys():
                            self.__tags_tree[tag][n] = deepcopy(tsd)
                        if 'tclist' not in self.__tags_tree[tag][n].keys():
                            self.__tags_tree[tag][n]['tclist'] = {}
                        self.__tags_tree[tag][n]['tclist'][k] = deepcopy(tcd)
                else:
                    if n not in self.__tags_tree['NoTags'].keys():
                        self.__tags_tree['NoTags'][n] = deepcopy(tsd)
                    if 'tclist' not in self.__tags_tree['NoTags'][n].keys():
                        self.__tags_tree['NoTags'][n]['tclist'] = {}
                    self.__tags_tree['NoTags'][n]['tclist'][k] = deepcopy(tcd)
        if len(tcs.keys()) > 0:
            self.__ts_tree[n] = deepcopy(tsd)
            self.__ts_tree[n]['tclist'] = tcs

    def finalize(self, result):
        # When no explicit suites were requested (or when generating the
        # tree), operate on every discovered suite.
        if (self.list_test and not self.suites) or self.gen_ts_tree:
            suites = list(self._tree.keys())
        else:
            suites = self.suites
        suites.sort()
        unknown = []
        if self.gen_ts_tree:
            func = self._gen_ts_tree
        else:
            func = self._print_suite_info
        for k in suites:
            try:
                # NOTE(review): eval() on a user-supplied suite name —
                # acceptable for a test tool, but worth confirming the
                # names are trusted CLI input only.
                suite = eval(k, globals(), self._tree)
            except BaseException:
                unknown.append(k)
                continue
            func(suite)
        if self.list_test:
            w = sys.stdout
            w.write('\n\n')
            w.write('Total number of Test Suites: %d\n' % (self.total_suite))
            w.write('Total number of Test Cases: %d\n' % (self.total_case))
        elif self.gen_ts_tree:
            tsdata = ''
            tagsdata = ''
            try:
                import json
                tsdata = json.dumps(self.__ts_tree, indent=4)
                tagsdata = json.dumps(self.__tags_tree, indent=4)
            except ImportError:
                # Fall back to simplejson, then to a crude repr-to-JSON
                # string conversion if neither library is present.
                try:
                    import simplejson
                    tsdata = simplejson.dumps(self.__ts_tree, indent=4)
                    tagsdata = simplejson.dumps(self.__tags_tree, indent=4)
                except ImportError:
                    _pre = str(self.__ts_tree).replace('"', '\\"')
                    tsdata = _pre.replace('\'', '"')
                    _pre = str(self.__tags_tree).replace('"', '\\"')
                    tagsdata = _pre.replace('\'', '"')
            f = open('ptl_ts_tree.json', 'w+')
            f.write(tsdata)
            f.close()
            f = open('ptl_tags_tree.json', 'w+')
            f.write(tagsdata)
            f.close()
        if len(unknown) > 0:
            self.logger.error('Unknown testsuite(s): %s' %
                              (','.join(unknown)))



================================================
FILE: test/fw/ptl/utils/plugins/ptl_test_loader.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE.
See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.


import os
import sys
import logging
import copy

from nose.plugins.base import Plugin
from ptl.utils.pbs_testsuite import PBSTestSuite
from ptl.utils.pbs_dshutils import DshUtils


class PTLTestLoader(Plugin):

    """
    Load test cases from given parameter
    """
    name = 'PTLTestLoader'
    score = sys.maxsize - 1
    logger = logging.getLogger(__name__)

    def __init__(self):
        Plugin.__init__(self)
        self.suites_list = []
        self.excludes = []
        self.follow = False
        # Sentinel keys for "bare" suite / case names (no dot notation).
        self._only_ts = '__only__ts__'
        self._only_tc = '__only__tc__'
        self._test_marker = 'test_'
        self._tests_list = {self._only_ts: [], self._only_tc: []}
        self._excludes_list = {self._only_ts: [], self._only_tc: []}
        # Copy consumed during loading; leftovers are "unknown" tests.
        self.__tests_list_copy = {self._only_ts: [], self._only_tc: []}
        self.__allowed_cls = []
        self.__allowed_method = []
        self.testfiles = None

    def options(self, parser, env):
        """
        Register command line options
        """
        pass

    def set_data(self, testgroup, suites, excludes, follow, testfiles=None):
        """
        Set the data required for loading test data

        :param testgroup: Test group
        :param suites: Test suites to load
        :param excludes: Tests to exclude while running
        :param testfiles: Flag to check if test is run by filename
        """
        # A readable testgroup file wins over the suites string; only
        # its first line is read (comma-separated suite names).
        if os.access(str(testgroup), os.R_OK):
            f = open(testgroup, 'r')
            self.suites_list.extend(f.readline().strip().split(','))
            f.close()
        elif suites is not None:
            self.suites_list.extend(suites.split(','))
        if excludes is not None:
            self.excludes.extend(excludes.split(','))
        self.follow = follow
        self.testfiles = testfiles

    def configure(self, options, config):
        """
        Configure the ``plugin`` and ``system``, based on selected options
        """
        # Normalize the requested names into the include dicts:
        # "Suite.case" -> per-suite case list, "test_x" -> bare cases,
        # anything else -> bare suites.
        tl = self._tests_list
        tlc = self.__tests_list_copy
        for _is in self.suites_list:
            if '.' in _is:
                suite, case = _is.split('.')
                if case in tl[self._only_tc]:
                    tl[self._only_tc].remove(case)
                    tlc[self._only_tc].remove(case)
                if suite in tl.keys():
                    if case not in tl[suite]:
                        tl[suite].append(case)
                        tlc[suite].append(case)
                else:
                    tl.setdefault(suite, [case])
                    tlc.setdefault(suite, [case])
            elif _is.startswith(self._test_marker):
                if _is not in tl[self._only_tc]:
                    tl[self._only_tc].append(_is)
                    tlc[self._only_tc].append(_is)
            else:
                if _is not in tl[self._only_ts]:
                    tl[self._only_ts].append(_is)
                    tlc[self._only_ts].append(_is)
        # A suite entry left with no cases means "the whole suite".
        for k, v in tl.items():
            if k in (self._only_ts, self._only_tc):
                continue
            if len(v) == 0:
                tl[self._only_ts].append(k)
                tlc[self._only_ts].append(k)
        for name in tl[self._only_ts]:
            if name in tl.keys():
                del tl[name]
                del tlc[name]
        # Same normalization for the exclusion list.
        extl = self._excludes_list
        for _is in self.excludes:
            if '.' in _is:
                suite, case = _is.split('.')
                if case in extl[self._only_tc]:
                    extl[self._only_tc].remove(case)
                if suite in extl.keys():
                    if case not in extl[suite]:
                        extl[suite].append(case)
                else:
                    extl.setdefault(suite, [case])
            elif _is.startswith(self._test_marker):
                if _is not in extl[self._only_tc]:
                    extl[self._only_tc].append(_is)
            else:
                if _is not in extl[self._only_ts]:
                    extl[self._only_ts].append(_is)
        for k, v in extl.items():
            if k in (self._only_ts, self._only_tc):
                continue
            if len(v) == 0:
                extl[self._only_ts].append(k)
        for name in extl[self._only_ts]:
            if name in extl.keys():
                del extl[name]
        self.logger.debug('included_tests:%s' % (str(self._tests_list)))
        self.logger.debug('included_tests(copy):%s' %
                          (str(self.__tests_list_copy)))
        self.logger.debug('excluded_tests:%s' % (str(self._excludes_list)))
        self.enabled = len(self.suites_list) > 0
        del self.suites_list
        del self.excludes

    def check_unknown(self):
        """
        Check for unknown test suite and test case
        """
        # Anything still in the "copy" lists was never matched during
        # loading: report it and abort.
        self.logger.debug('check_unknown called')
        tests_list_copy = copy.deepcopy(self.__tests_list_copy)
        only_ts = tests_list_copy.pop(self._only_ts)
        only_tc = tests_list_copy.pop(self._only_tc)
        msg = []
        if len(tests_list_copy) > 0:
            for k, v in tests_list_copy.items():
                msg.extend(map(lambda x: k + '.' + x, v))
        if len(only_tc) > 0:
            msg.extend(only_tc)
        if len(msg) > 0:
            _msg = ['unknown testcase(s): %s' % (','.join(msg))]
            msg = _msg
        if len(only_ts) > 0:
            msg += ['unknown testsuite(s): %s' % (','.join(only_ts))]
        if len(msg) > 0:
            for l in msg:
                self.logger.error(l)
            sys.exit(1)

    def prepareTestLoader(self, loader):
        """
        Prepare test loader
        """
        # Wrap loadTestsFromNames so the PTL test directories are added
        # to the search path and unknown names are reported afterwards.
        old_loadTestsFromNames = loader.loadTestsFromNames

        def check_loadTestsFromNames(names, module=None):
            tests_dir = names
            if not self.testfiles:
                ptl_test_dir = __file__
                ptl_test_dir = os.path.join(ptl_test_dir.split('ptl')[0],
                                            "ptl", "tests")
                user_test_dir = os.environ.get("PTL_TESTS_DIR", None)
                if user_test_dir and os.path.isdir(user_test_dir):
                    tests_dir += [user_test_dir]
                if os.path.isdir(ptl_test_dir):
                    tests_dir += [ptl_test_dir]
            rv = old_loadTestsFromNames(tests_dir, module)
            self.check_unknown()
            return rv
        loader.loadTestsFromNames = check_loadTestsFromNames
        return loader

    def check_follow(self, cls, method=None):
        # Decide whether cls (and optionally one of its methods) is
        # selected by the include/exclude lists; with self.follow set,
        # the decision recurses up the first base class.
        cname = cls.__name__
        if not issubclass(cls, PBSTestSuite):
            return False
        if cname == 'PBSTestSuite':
            if 'PBSTestSuite' not in self._tests_list[self._only_ts]:
                return False
        if cname in self._excludes_list[self._only_ts]:
            return False
        if cname in self._tests_list[self._only_ts]:
            if cname in self.__tests_list_copy[self._only_ts]:
                self.__tests_list_copy[self._only_ts].remove(cname)
            return True
        if ((cname in self._tests_list.keys()) and (method is None)):
            return True
        if method is not None:
            mname = method.__name__
            if not mname.startswith(self._test_marker):
                return False
            if mname in self._excludes_list[self._only_tc]:
                return False
            if ((cname in self._excludes_list.keys()) and
                    (mname in self._excludes_list[cname])):
                return False
            if ((cname in self._tests_list.keys()) and
                    (mname in self._tests_list[cname])):
                if cname in self.__tests_list_copy.keys():
                    if mname in self.__tests_list_copy[cname]:
                        self.__tests_list_copy[cname].remove(mname)
                        if len(self.__tests_list_copy[cname]) == 0:
                            del self.__tests_list_copy[cname]
                return True
            if mname in self._tests_list[self._only_tc]:
                if mname in self.__tests_list_copy[self._only_tc]:
                    self.__tests_list_copy[self._only_tc].remove(mname)
                return True
        if self.follow:
            return self.check_follow(cls.__bases__[0], method)
        else:
            return False

    def is_already_allowed(self, cls, method=None):
        """
        :param method: Method to check
        :returns: True if method is already allowed else False
        """
        name = cls.__name__
        if method is not None:
            name += '.' + method.__name__
            if name in self.__allowed_method:
                return True
            else:
                self.__allowed_method.append(name)
                return False
        else:
            if name in self.__allowed_cls:
                return True
            else:
                self.__allowed_cls.append(name)
                return False

    def wantClass(self, cls):
        """
        Is the class wanted?
        """
        has_test = False
        for t in dir(cls):
            if t.startswith(self._test_marker):
                has_test = True
                break
        if not has_test:
            return False
        rv = self.check_follow(cls)
        # NOTE(review): returns None (not True) when wanted — nose
        # treats None as "no opinion"; presumably intentional, confirm.
        if rv and not self.is_already_allowed(cls):
            self.logger.debug('wantClass:%s' % (str(cls)))
        else:
            return False

    def wantFunction(self, function):
        """
        Is the function wanted?
        """
        return self.wantMethod(function)

    def wantMethod(self, method):
        """
        Is the method wanted?
        """
        try:
            cls = method.__self__.__class__
        except AttributeError:
            return False
        if not method.__name__.startswith(self._test_marker):
            return False
        rv = self.check_follow(cls, method)
        if rv and not self.is_already_allowed(cls, method):
            self.logger.debug('wantMethod:%s' % (str(method)))
        else:
            return False



================================================
FILE: test/fw/ptl/utils/plugins/ptl_test_runner.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software.
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
import datetime
import logging
import fnmatch
import os
import platform
import pwd
import re
import signal
import socket
import sys
import time
import tempfile
import unittest
from threading import Timer
from logging import StreamHandler
from traceback import format_exception
from types import ModuleType

from nose.core import TextTestRunner
from nose.plugins.base import Plugin
from nose.plugins.skip import SkipTest
from nose.suite import ContextSuite
from nose.util import isclass

import ptl
from ptl.lib.pbs_testlib import PBSInitServices
from ptl.utils.pbs_covutils import LcovUtils
from ptl.utils.pbs_dshutils import DshUtils
from ptl.utils.pbs_dshutils import TimeOut
from ptl.utils.pbs_testsuite import (MINIMUM_TESTCASE_TIMEOUT,
                                     REQUIREMENTS_KEY, TIMEOUT_KEY)
from ptl.utils.plugins.ptl_test_info import get_effective_reqs
from ptl.utils.pbs_testusers import PBS_ALL_USERS, PBS_USERS, PbsUser
from ptl.lib.ptl_constants import (PTL_TRUE, PTL_FALSE)
from io import StringIO

log = logging.getLogger('nose.plugins.PTLTestRunner')


class TCThresholdReached(Exception):
    """
    Raise this exception to tell that tc-failure-threshold reached
    """


class TestLogCaptureHandler(StreamHandler):
    """
    Log handler for capturing logs which test case print
    using logging module
    """

    def __init__(self):
        self.buffer = StringIO()
        StreamHandler.__init__(self, self.buffer)
        # DEBUG2 is a PTL-specific logging level added elsewhere in the
        # framework (not a stdlib logging constant).
        self.setLevel(logging.DEBUG2)
        fmt = '%(asctime)-15s %(levelname)-8s %(message)s'
        self.setFormatter(logging.Formatter(fmt))

    def get_logs(self):
        # Return everything captured since the buffer was last reset.
        return self.buffer.getvalue()


class _PtlTestResult(unittest.TestResult):
    """
    Ptl custom test result
    """
    separator1 = '=' * 70
    separator2 = '___m_oo_m___'
    logger = logging.getLogger(__name__)

    def __init__(self, stream, descriptions, verbosity, config=None):
        unittest.TestResult.__init__(self)
        self.stream = stream
        self.showAll = verbosity > 1
        self.dots = verbosity == 1
        self.descriptions = descriptions
        self.errorClasses = {}
        self.config = config
        self.success = []
        self.skipped = []
        self.timedout = []
        self.handler = TestLogCaptureHandler()
        self.start = datetime.datetime.now()
        self.stop = datetime.datetime.now()

    def getDescription(self, test):
        """
        Get the test result description
        """
        if hasattr(test, 'test'):
            return str(test.test)
        elif isinstance(test.context, ModuleType):
            tmn = getattr(test.context, '_testMethodName', 'unknown')
            return '%s (%s)' % (tmn, test.context.__name__)
        elif isinstance(test, ContextSuite):
            tmn = getattr(test.context, '_testMethodName', 'unknown')
            return '%s (%s.%s)' % (tmn,
                                   test.context.__module__,
                                   test.context.__name__)
        else:
            return str(test)

    def getTestDoc(self, test):
        """
        Get test document
        """
        if hasattr(test, 'test'):
            if hasattr(test.test, '_testMethodDoc'):
                return test.test._testMethodDoc
            else:
                return None
        else:
            if hasattr(test, '_testMethodDoc'):
                return test._testMethodDoc
            else:
                return None

    def clear_stop(self):
        # Reset the stop flag so a subsequent run can proceed.
        self.shouldStop = False

    def startTest(self, test):
        """
        Start the test

        :param test: Test to start
        :type test: str
        """
        # (Re)attach the capture handler and reset its buffer so each
        # test's captured log starts empty.
        ptl_logger = logging.getLogger('ptl')
        if self.handler not in ptl_logger.handlers:
            ptl_logger.addHandler(self.handler)
        self.handler.buffer.truncate(0)
        self.handler.buffer.seek(0)
        unittest.TestResult.startTest(self, test)
        test.start_time = datetime.datetime.now()
        if self.showAll:
            self.logger.info('test name: ' + self.getDescription(test) +
                             '...')
            self.logger.info('test start time: ' + test.start_time.ctime())
            tdoc = self.getTestDoc(test)
            if tdoc is not None:
                tdoc = '\n' + tdoc
            self.logger.info('test docstring: %s' % (tdoc))

    def addSuccess(self, test):
        """
        Add success to the test result
        """
        self.success.append(test)
        unittest.TestResult.addSuccess(self, test)
        if self.showAll:
            self.logger.info('ok\n')
        elif self.dots:
            self.logger.info('.')

    def _addError(self, test, err):
        unittest.TestResult.addError(self, test, err)
        if self.showAll:
            self.logger.info('ERROR\n')
        elif self.dots:
            self.logger.info('E')

    def addError(self, test, err):
        """
        Add error to the test result

        :param test: Test for which to add error
        :type test: str
        :param error: Error message to add
        :type error: str
        """
        # Threshold exceptions are swallowed; skips and timeouts are
        # routed to their dedicated collectors.
        if isclass(err[0]) and issubclass(err[0], TCThresholdReached):
            return
        if isclass(err[0]) and issubclass(err[0], SkipTest):
            self.addSkip(test, err[1])
            return
        if isclass(err[0]) and issubclass(err[0], TimeOut):
            self.addTimedOut(test, err)
            return
        # Plugin-registered error classes get their own storage/label.
        for cls, (storage, label, isfail) in self.errorClasses.items():
            if isclass(err[0]) and issubclass(err[0], cls):
                if isfail:
                    test.passed = False
                storage.append((test, err))
                if self.showAll:
                    self.logger.info(label + '\n')
                elif self.dots:
                    self.logger.info(label[0])
                return
        test.passed = False
        self._addError(test, err)

    def addFailure(self, test, err):
        """
        Indicate failure
        """
        unittest.TestResult.addFailure(self, test, err)
        if self.showAll:
            self.logger.info('FAILED\n')
        elif self.dots:
            self.logger.info('F')

    def addSkip(self, test, reason):
        """
        Indicate skipping of test

        :param test: Test to skip
        :type test: str
        :param reason: Reason fot the skip
        :type reason: str
        """
        self.skipped.append((test, reason))
        if self.showAll:
            self.logger.info('SKIPPED')
        elif self.dots:
            self.logger.info('S')

    def addTimedOut(self, test, err):
        """
        Indicate timeout

        :param test: Test for which timeout happened
        :type test: str
        :param err: Error for timeout
        :type err: str
        """
        self.timedout.append((test, self._exc_info_to_string(err, test)))
        if self.showAll:
            self.logger.info('TIMEDOUT')
        elif self.dots:
            self.logger.info('T')

    def printErrors(self):
        """
        Print the errors
        """
        _blank_line = False
        if ((len(self.errors) > 0) or (len(self.failures) > 0) or
                (len(self.timedout) > 0)):
            if self.dots or self.showAll:
                self.logger.info('')
                _blank_line = True
            self.printErrorList('ERROR', self.errors)
            self.printErrorList('FAILED', self.failures)
            self.printErrorList('TIMEDOUT', self.timedout)
        for cls in self.errorClasses.keys():
            storage, label, isfail = self.errorClasses[cls]
            if isfail:
                if not _blank_line:
                    self.logger.info('')
                    _blank_line = True
                self.printErrorList(label, storage)
        self.config.plugins.report(self.stream)

    def printErrorList(self, flavour, errors):
        """
        Print the error list

        :param errors: Errors to print
        """
        for test, err in errors:
            self.logger.info(self.separator1)
            self.logger.info('%s: %s\n' % (flavour,
                                           self.getDescription(test)))
            self.logger.info(self.separator2)
            self.logger.info('%s\n' % err)

    def printLabel(self, label, err=None):
        """
        Print the label for the error

        :param label: Label to print
        :type label: str
        :param err: Error for which label to be printed
        :type err: str
        """
        if self.showAll:
            message = [label]
            if err:
                try:
                    detail = str(err[1])
                except BaseException:
                    detail = None
                if detail:
                    message.append(detail)
            self.logger.info(': '.join(message))
        elif self.dots:
            self.logger.info(label[:1])

    def wasSuccessful(self):
        """
        Check whether the test successful or not

        :returns: True if no ``errors`` or no ``failures`` or no
                  ``timeout`` else return False
        """
        if self.errors or self.failures or self.timedout:
            return False
        for cls in self.errorClasses.keys():
            storage, _, isfail = self.errorClasses[cls]
            if not isfail:
                continue
            if storage:
                return False
        return True

    def printSummary(self):
        """
        Called by the test runner to print the final summary of test
        run results.

        :param start: Time at which test begins
        :param stop: Time at which test ends
        """
        self.printErrors()
        msg = ['=' * 80]
        ef = []
        error = 0
        fail = 0
        skip = 0
        timedout = 0
        success = len(self.success)
        if len(self.failures) > 0:
            for failedtest in self.failures:
                fail += 1
                msg += ['failed: ' + self.getDescription(failedtest[0])]
                ef.append(failedtest)
        if len(self.errors) > 0:
            for errtest in self.errors:
                error += 1
                msg += ['error: ' + self.getDescription(errtest[0])]
                ef.append(errtest)
        if len(self.skipped) > 0:
            for skiptest, reason in self.skipped:
                skip += 1
                _msg = 'skipped: ' + str(skiptest).strip()
                _msg += ' reason: ' + str(reason).strip()
                msg += [_msg]
        if len(self.timedout) > 0:
            for tdtest in self.timedout:
                timedout += 1
                msg += ['timedout: ' + self.getDescription(tdtest[0])]
                ef.append(tdtest)
        # Collect unique case and suite names from errors/failures/
        # timeouts for the summary footer.
        cases = []
        suites = []
        for _ef in ef:
            if hasattr(_ef[0], 'test'):
                cname = _ef[0].test.__class__.__name__
                tname = getattr(_ef[0].test, '_testMethodName', 'unknown')
                cases.append(cname + '.' + tname)
                suites.append(cname)
        cases = sorted(list(set(cases)))
        suites = sorted(list(set(suites)))
        if len(cases) > 0:
            _msg = 'Test cases with failures: '
            _msg += ','.join(cases)
            msg += [_msg]
        if len(suites) > 0:
            _msg = 'Test suites with failures: '
            _msg += ','.join(suites)
            msg += [_msg]
        runned = success + fail + error + skip + timedout
        _msg = 'run: ' + str(runned)
        _msg += ', succeeded: ' + str(success)
        _msg += ', failed: ' + str(fail)
        _msg += ', errors: ' + str(error)
        _msg += ', skipped: ' + str(skip)
        _msg += ', timedout: ' + str(timedout)
        msg += [_msg]
        msg += ['Tests run in ' + str(self.stop - self.start)]
        self.logger.info('\n'.join(msg))


class SystemInfo:
    """
    used to get system's ram size and disk size information.
    :system_ram: Available ram(in GB) of the test running machine
    :system_disk: Available disk size(in GB) of the test running machine
    """
    logger = logging.getLogger(__name__)

    def get_system_info(self, hostname=None):
        # Populate system_total_ram / system_ram / system_disk /
        # system_disk_used_percent attributes for the given host.
        du = DshUtils()
        # getting RAM size in gb
        mem_info = du.cat(hostname, "/proc/meminfo")
        if mem_info['rc'] != 0:
            _msg = 'failed to get content of /proc/meminfo of host: '
            # NOTE(review): concatenation raises TypeError when
            # hostname is None (the default) — confirm callers always
            # pass a hostname on the error path.
            self.logger.error(_msg + hostname)
        else:
            got_mem_available = False
            # Values in /proc/meminfo are in kB; divide by 2**20 for GB.
            for i in mem_info['out']:
                if "MemTotal" in i:
                    self.system_total_ram = float(i.split()[1]) / (2**20)
                elif "MemAvailable" in i:
                    mem_available = float(i.split()[1]) / (2**20)
                    got_mem_available = True
                    break
                elif "MemFree" in i:
                    mem_free = float(i.split()[1]) / (2**20)
                elif "Buffers" in i:
                    buffers = float(i.split()[1]) / (2**20)
                elif i.startswith("Cached"):
                    # startswith avoids matching the "SwapCached" line.
                    cached = float(i.split()[1]) / (2**20)
            if got_mem_available:
                self.system_ram = mem_available
            else:
                # NOTE(review): assumes MemFree/Buffers/Cached all
                # appeared before this point; a meminfo missing any of
                # them would raise UnboundLocalError — confirm.
                self.system_ram = mem_free + buffers + cached
        # getting disk size in gb
        pbs_conf = du.parse_pbs_config(hostname)
        pbs_home_info = du.run_cmd(hostname,
                                   cmd=['df', '-k', pbs_conf['PBS_HOME']])
        if pbs_home_info['rc'] != 0:
            _msg = 'failed to get output of df -k command of host: '
            self.logger.error(_msg + hostname)
        else:
            # df -k: row 1 is the data row; column 3 is available kB,
            # column 4 is the use percentage.
            disk_info = pbs_home_info['out']
            disk_size = disk_info[1].split()
            self.system_disk = float(disk_size[3]) / (2**20)
            self.system_disk_used_percent = float(disk_size[4].rstrip('%'))


class PtlTextTestRunner(TextTestRunner):

    """
    Test runner that uses ``PtlTestResult`` to enable errorClasses,
    as well as providing hooks for plugins to override or replace the test
    output stream, results, and the test case itself.
    """
    # Class attribute read by other plugins to know which repetition is
    # currently executing (1-based).
    cur_repeat_count = 1

    def __init__(self, stream=sys.stdout, descriptions=True, verbosity=3,
                 config=None, repeat_count=1, repeat_delay=0):
        self.logger = logging.getLogger(__name__)
        self.result = None
        self.repeat_count = repeat_count
        self.repeat_delay = repeat_delay
        TextTestRunner.__init__(self, stream, descriptions, verbosity,
                                config)

    def _makeResult(self):
        return _PtlTestResult(self.stream, self.descriptions,
                              self.verbosity, self.config)

    def run(self, test):
        """
        Overrides to provide plugin hooks and defer all output to the test
        result class.
        """
        do_exit = False
        wrapper = self.config.plugins.prepareTest(test)
        if wrapper is not None:
            test = wrapper
        wrapped = self.config.plugins.setOutputStream(self.stream)
        if wrapped is not None:
            self.stream = wrapped
        self.result = result = self._makeResult()
        self.result.start = datetime.datetime.now()
        try:
            # Run the whole collection repeat_count times, pausing
            # repeat_delay seconds between repetitions.
            for i in range(self.repeat_count):
                PtlTextTestRunner.cur_repeat_count = i + 1
                if i != 0:
                    time.sleep(self.repeat_delay)
                test(result)
            if self.repeat_count > 1:
                self.logger.info("==========================================")
                self.logger.info("All Tests are repeated %d times" %
                                 self.repeat_count)
                self.logger.info("==========================================")
        except KeyboardInterrupt:
            do_exit = True
        self.result.stop = datetime.datetime.now()
        result.printSummary()
        self.config.plugins.finalize(result)
        if do_exit:
            sys.exit(1)
        return result


class PTLTestRunner(Plugin):

    """
    PTL Test Runner Plugin
    """
    name = 'PTLTestRunner'
    score = sys.maxsize - 4
    logger = logging.getLogger(__name__)
    timeout = None

    def __init__(self):
        Plugin.__init__(self)
        self.param = None
        self.repeat_count = 1
        self.repeat_delay = 0
        self.use_cur_setup = False
        self.lcov_bin = None
        self.lcov_data = None
        self.lcov_out = None
        self.lcov_utils = None
        self.lcov_nosrc = None
        self.lcov_baseurl = None
        self.genhtml_bin = None
        self.config = None
        self.result = None
        self.tc_failure_threshold = None
        self.cumulative_tc_failure_threshold = None
        self.__failed_tc_count = 0
        self.__tf_count =
0 self.__failed_tc_count_msg = False self._test_marker = 'test_' self.hardware_report_timer = None def options(self, parser, env): """ Register command line options """ pass def set_data(self, paramfile, testparam, repeat_count, repeat_delay, lcov_bin, lcov_data, lcov_out, genhtml_bin, lcov_nosrc, lcov_baseurl, tc_failure_threshold, cumulative_tc_failure_threshold, use_cur_setup): if paramfile is not None: _pf = open(paramfile, 'r') _params_from_file = _pf.readlines() _pf.close() _nparams = [] for l in range(len(_params_from_file)): if _params_from_file[l].startswith('#'): continue else: _nparams.append(_params_from_file[l]) _f = ','.join([l.strip('\r\n') for l in _nparams]) if testparam is not None: testparam += ',' + _f else: testparam = _f self.param = testparam self.repeat_count = repeat_count self.repeat_delay = repeat_delay self.use_cur_setup = use_cur_setup self.lcov_bin = lcov_bin self.lcov_data = lcov_data self.lcov_out = lcov_out self.genhtml_bin = genhtml_bin self.lcov_nosrc = lcov_nosrc self.lcov_baseurl = lcov_baseurl self.tc_failure_threshold = tc_failure_threshold self.cumulative_tc_failure_threshold = cumulative_tc_failure_threshold def configure(self, options, config): """ Configure the plugin and system, based on selected options """ self.config = config self.enabled = True self.param_dict = self.__get_param_dictionary() def prepareTestRunner(self, runner): """ Prepare test runner """ return PtlTextTestRunner(verbosity=3, config=self.config, repeat_count=self.repeat_count, repeat_delay=self.repeat_delay) def prepareTestResult(self, result): """ Prepare test result """ self.result = result def startContext(self, context): context.param = self.param context.use_cur_setup = self.use_cur_setup context.start_time = datetime.datetime.now() if isclass(context) and issubclass(context, unittest.TestCase): self.result.logger.info(self.result.separator1) self.result.logger.info('suite name: ' + context.__name__) doc = context.__doc__ if doc is not None: 
self.result.logger.info('suite docstring: \n' + doc + '\n') self.result.logger.info(self.result.separator1) self.__failed_tc_count = 0 self.__failed_tc_count_msg = False def __get_timeout(self, test): _test = None if hasattr(test, 'test'): _test = test.test elif hasattr(test, 'context'): _test = test.context if _test is None: return MINIMUM_TESTCASE_TIMEOUT dflt_timeout = int(getattr(_test, 'conf', {}).get('default-testcase-timeout', MINIMUM_TESTCASE_TIMEOUT)) tc_timeout = int(getattr(getattr(_test, getattr(_test, '_testMethodName', ''), None), TIMEOUT_KEY, 0)) return max([dflt_timeout, tc_timeout]) def __set_test_end_data(self, test, err=None): if self.hardware_report_timer is not None: self.hardware_report_timer.cancel() if not hasattr(test, 'start_time'): test = test.context if err is not None: is_skip = issubclass(err[0], SkipTest) is_tctr = issubclass(err[0], TCThresholdReached) if not (is_skip or is_tctr): self.__failed_tc_count += 1 self.__tf_count += 1 try: test.err_in_string = self.result._exc_info_to_string(err, test) except BaseException: etype, value, tb = err test.err_in_string = ''.join(format_exception(etype, value, tb)) else: test.err_in_string = 'None' test.end_time = datetime.datetime.now() test.duration = test.end_time - test.start_time test.captured_logs = self.result.handler.get_logs() def __get_param_dictionary(self): """ Method to convert data in param into dictionary of cluster information """ def get_bool(v): if v is None or v == '': return False if v in PTL_TRUE: return True if v in PTL_FALSE: return False raise ValueError("Need boolean value, not %s" % v) tparam_contents = {} nomomlist = [] shortname = (socket.gethostname()).split('.', 1)[0] for key in ['servers', 'moms', 'comms', 'clients', 'nomom']: tparam_contents[key] = [] tparam_contents['mom_on_server'] = False tparam_contents['no_mom_on_server'] = False tparam_contents['no_comm_on_server'] = False tparam_contents['no_comm_on_mom'] = False if self.param is not None: for h in 
self.param.split(','): if '=' in h: k, v = h.split('=', 1) hosts = [x.split('@')[0] for x in v.split(':')] if (k == 'server' or k == 'servers'): tparam_contents['servers'].extend(hosts) elif (k == 'mom' or k == 'moms'): tparam_contents['moms'].extend(hosts) elif k == 'comms': tparam_contents['comms'] = hosts elif k == 'client': tparam_contents['clients'] = hosts elif k == 'nomom': nomomlist = hosts elif k == 'mom_on_server': tparam_contents['mom_on_server'] = get_bool(v) elif k == 'no_mom_on_server': tparam_contents['no_mom_on_server'] = get_bool(v) elif k == 'no_comm_on_mom': tparam_contents['no_comm_on_mom'] = get_bool(v) for pkey in ['servers', 'moms', 'comms', 'clients']: if not tparam_contents[pkey]: tparam_contents[pkey] = set([shortname]) else: tparam_contents[pkey] = set(tparam_contents[pkey]) if nomomlist: tparam_contents['nomom'] = set(nomomlist) return tparam_contents @staticmethod def __are_requirements_matching(param_dic=None, test=None): """ Validates test requirements against test cluster information returns True on match or error message otherwise None :param param_dic: dictionary of cluster information from data passed to param list :param_dic type: dic :param test: test object :test type: object :returns True or error message or None """ logger = logging.getLogger(__name__) ts_requirements = {} tc_requirements = {} param_count = {} _servers = set(param_dic['servers']) _moms = set(param_dic['moms']) _comms = set(param_dic['comms']) _nomom = set(param_dic['nomom']) _mom_on_server = param_dic['mom_on_server'] _no_mom_on_server = param_dic['no_mom_on_server'] _no_comm_on_mom = param_dic['no_comm_on_mom'] _no_comm_on_server = param_dic['no_comm_on_server'] shortname = (socket.gethostname()).split('.', 1)[0] if test is None: return None test_name = getattr(test.test, '_testMethodName', None) if test_name is not None: method = getattr(test.test, test_name, None) if method is not None: tc_requirements = getattr(method, REQUIREMENTS_KEY, {}) cls = 
method.__self__.__class__ ts_requirements = getattr(cls, REQUIREMENTS_KEY, {}) if not tc_requirements: if not ts_requirements: return None eff_tc_req = get_effective_reqs(ts_requirements, tc_requirements) setattr(test.test, 'requirements', eff_tc_req) for key in ['servers', 'moms', 'comms', 'clients']: param_count['num_' + key] = len(param_dic[key]) for pk in param_count: if param_count[pk] < eff_tc_req[pk]: _msg = 'available ' + pk + " (" _msg += str(param_count[pk]) + ") is less than required " + pk _msg += " (" + str(eff_tc_req[pk]) + ")" logger.error(_msg) return _msg if hasattr(test, 'test'): _test = test.test elif hasattr(test, 'context'): _test = test.context else: return None name = 'moms' if (hasattr(_test, name) and (getattr(_test, name, None) is not None)): for mc in getattr(_test, name).values(): platform = mc.platform if platform not in ['linux', 'shasta', 'cray'] and mc.hostname in _moms: _moms.remove(mc.hostname) for hostname in _moms: si = SystemInfo() si.get_system_info(hostname) available_sys_ram = getattr(si, 'system_ram', None) if available_sys_ram is None: _msg = 'failed to get ram info on host: ' + hostname logger.error(_msg) return _msg elif eff_tc_req['min_mom_ram'] >= available_sys_ram: _msg = hostname + ': available ram (' + str(available_sys_ram) _msg += ') is less than the minimum required ram (' _msg += str(eff_tc_req['min_mom_ram']) _msg += ') for test execution' logger.error(_msg) return _msg available_sys_disk = getattr(si, 'system_disk', None) if available_sys_disk is None: _msg = 'failed to get disk info on host: ' + hostname logger.error(_msg) return _msg elif eff_tc_req['min_mom_disk'] >= available_sys_disk: _msg = hostname + ': available disk space (' _msg += str(available_sys_disk) _msg += ') is less than the minimum required disk space (' _msg += str(eff_tc_req['min_mom_disk']) _msg += ') for test execution' logger.error(_msg) return _msg for hostname in param_dic['servers']: si = SystemInfo() si.get_system_info(hostname) 
available_sys_ram = getattr(si, 'system_ram', None) if available_sys_ram is None: _msg = 'failed to get ram info on host: ' + hostname logger.error(_msg) return _msg elif eff_tc_req['min_server_ram'] >= available_sys_ram: _msg = hostname + ': available ram (' + str(available_sys_ram) _msg += ') is less than the minimum required ram (' _msg += str(eff_tc_req['min_server_ram']) _msg += ') for test execution' logger.error(_msg) return _msg available_sys_disk = getattr(si, 'system_disk', None) if available_sys_disk is None: _msg = 'failed to get disk info on host: ' + hostname logger.error(_msg) return _msg elif eff_tc_req['min_server_disk'] >= available_sys_disk: _msg = hostname + ': available disk space (' _msg += str(available_sys_disk) _msg += ') is less than the minimum required disk space (' _msg += str(eff_tc_req['min_server_disk']) _msg += ') for test execution' logger.error(_msg) return _msg if _moms & _servers: if eff_tc_req['no_mom_on_server'] or \ (_nomom - _servers) or \ _no_mom_on_server: _msg = 'no mom on server' logger.error(_msg) return _msg else: if eff_tc_req['mom_on_server'] or \ _mom_on_server: _msg = 'mom on server' logger.error(_msg) return _msg if _comms & _servers: if eff_tc_req['no_comm_on_server'] or _no_comm_on_server: _msg = 'no comm on server' logger.error(_msg) return _msg comm_mom_list = _moms & _comms if comm_mom_list and shortname in comm_mom_list: # Excluding the server hostname for flag 'no_comm_on_mom' comm_mom_list.remove(shortname) if comm_mom_list: if eff_tc_req['no_comm_on_mom']: _msg = 'no comm on mom' logger.error(_msg) return _msg else: if not eff_tc_req['no_comm_on_mom']: _msg = 'no comm on server' logger.error(_msg) return _msg def check_hardware_status_and_core_files(self, test): """ function checks hardware status and core files every 5 minutes """ du = DshUtils() systems = list(self.param_dict['servers']) systems.extend(self.param_dict['moms']) systems.extend(self.param_dict['comms']) systems = list(set(systems)) if 
hasattr(test, 'test'): _test = test.test elif hasattr(test, 'context'): _test = test.context else: return None for name in ['servers', 'moms', 'comms', 'clients']: mlist = None if (hasattr(_test, name) and (getattr(_test, name, None) is not None)): mlist = getattr(_test, name).values() if mlist: for mc in mlist: platform = mc.platform if ((platform not in ['linux', 'shasta', 'cray']) and (mc.hostname in systems)): systems.remove(mc.hostname) self.hardware_report_timer = Timer( 300, self.check_hardware_status_and_core_files, args=(test,)) self.hardware_report_timer.start() for hostname in systems: hr = SystemInfo() hr.get_system_info(hostname) # monitors disk used_disk_percent = getattr(hr, 'system_disk_used_percent', None) if used_disk_percent is None: _msg = hostname _msg += ": unable to get disk info" self.hardware_report_timer.cancel() raise SkipTest(_msg) elif 70 <= used_disk_percent < 95: _msg = hostname + ": disk usage is at " _msg += str(used_disk_percent) + "%" _msg += ", disk cleanup is recommended." 
self.logger.warning(_msg) elif used_disk_percent >= 95: _msg = hostname + ":disk usage > 95%, skipping the test(s)" self.hardware_report_timer.cancel() raise SkipTest(_msg) # checks for core files pbs_conf = du.parse_pbs_config(hostname) mom_priv_path = os.path.join(pbs_conf["PBS_HOME"], "mom_priv") if du.isdir(hostname=hostname, path=mom_priv_path): mom_priv_files = du.listdir( hostname=hostname, path=mom_priv_path, sudo=True, fullpath=False) if fnmatch.filter(mom_priv_files, "core*"): _msg = hostname + ": core files found in " _msg += mom_priv_path self.logger.warning(_msg) server_priv_path = os.path.join( pbs_conf["PBS_HOME"], "server_priv") if du.isdir(hostname=hostname, path=server_priv_path): server_priv_files = du.listdir( hostname=hostname, path=server_priv_path, sudo=True, fullpath=False) if fnmatch.filter(server_priv_files, "core*"): _msg = hostname + ": core files found in " _msg += server_priv_path self.logger.warning(_msg) sched_priv_path = os.path.join(pbs_conf["PBS_HOME"], "sched_priv") if du.isdir(hostname=hostname, path=sched_priv_path): sched_priv_files = du.listdir( hostname=hostname, path=sched_priv_path, sudo=True, fullpath=False) if fnmatch.filter(sched_priv_files, "core*"): _msg = hostname + ": core files found in " _msg += sched_priv_path self.logger.warning(_msg) for u in PBS_ALL_USERS: user_home_files = du.listdir(hostname=hostname, path=u.home, sudo=True, fullpath=False, runas=u.name) if user_home_files and fnmatch.filter( user_home_files, "core*"): _msg = hostname + ": user-" + str(u) _msg += ": core files found in " self.logger.warning(_msg + u.home) def startTest(self, test): """ Start the test """ if ((self.cumulative_tc_failure_threshold != 0) and (self.__tf_count >= self.cumulative_tc_failure_threshold)): _msg = 'Total testcases failure count exceeded cumulative' _msg += ' testcase failure threshold ' _msg += '(%d)' % self.cumulative_tc_failure_threshold self.logger.error(_msg) raise KeyboardInterrupt if ((self.tc_failure_threshold 
!= 0) and (self.__failed_tc_count >= self.tc_failure_threshold)): if self.__failed_tc_count_msg: raise TCThresholdReached _msg = 'Testcases failure for this testsuite count exceeded' _msg += ' testcase failure threshold ' _msg += '(%d)' % self.tc_failure_threshold self.logger.error(_msg) self.__failed_tc_count_msg = True raise TCThresholdReached rv = None rv = self.__are_requirements_matching(self.param_dict, test) if rv is not None: # Below method call is needed in order to get the test case # details in the output and to have the skipped test count # included in total run count of the test run self.result.startTest(test) raise SkipTest(rv) # function report hardware status and core files self.check_hardware_status_and_core_files(test) def timeout_handler(signum, frame): raise TimeOut('Timed out after %s second' % timeout) if PTLTestRunner.timeout is None: timeout = self.__get_timeout(test) old_handler = signal.signal(signal.SIGALRM, timeout_handler) setattr(test, 'old_sigalrm_handler', old_handler) signal.alarm(timeout) def stopTest(self, test): """ Stop the test """ old_sigalrm_handler = getattr(test, 'old_sigalrm_handler', None) if old_sigalrm_handler is not None: signal.signal(signal.SIGALRM, old_sigalrm_handler) signal.alarm(0) def addError(self, test, err): """ Add error """ if isclass(err[0]) and issubclass(err[0], TCThresholdReached): return True self.__set_test_end_data(test, err) def addFailure(self, test, err): """ Add failure """ self.__set_test_end_data(test, err) def addSuccess(self, test): """ Add success """ self.__set_test_end_data(test) def _cleanup(self): self.logger.info('Cleaning up temporary files') du = DshUtils() hosts = set(self.param_dict['moms']).union( set(self.param_dict['servers'])) for user in PBS_USERS: self.logger.debug('Cleaning %s\'s home directory' % (str(user))) runas = PbsUser.get_user(user) for host in hosts: ret = du.run_cmd(host, cmd=['printenv', 'HOME'], sudo=True, runas=runas, logerr=False, as_script=False, 
level=logging.DEBUG) if ret['rc'] == 0: path = ret['out'][0].strip() else: return None ftd = [] files = du.listdir(host, path=path, runas=user, level=logging.DEBUG) bn = os.path.basename ftd.extend([f for f in files if bn(f).startswith('PtlPbs')]) ftd.extend([f for f in files if bn(f).startswith('STDIN')]) if len(ftd) > 1000: for i in range(0, len(ftd), 1000): j = i + 1000 du.rm(host, path=ftd[i:j], runas=user, force=True, level=logging.DEBUG) root_dir = os.sep dirlist = set([os.path.join(root_dir, 'tmp'), os.path.join(root_dir, 'var', 'tmp')]) # get tmp dir from the environment for envname in 'TMPDIR', 'TEMP', 'TMP': dirname = os.getenv(envname) if dirname: dirlist.add(dirname) p = re.compile(r'^pbs\.\d+') for tmpdir in dirlist: # list the contents of each tmp dir and # get the file list to be deleted self.logger.info('Cleaning up ' + tmpdir + ' dir') ftd = [] files = du.listdir(path=tmpdir) bn = os.path.basename ftd.extend([f for f in files if bn(f).startswith('PtlPbs')]) ftd.extend([f for f in files if bn(f).startswith('STDIN')]) ftd.extend([f for f in files if bn(f).startswith('pbsscrpt')]) ftd.extend([f for f in files if bn(f).startswith('pbs.conf.')]) ftd.extend([f for f in files if p.match(bn(f))]) for f in ftd: du.rm(path=f, sudo=True, recursive=True, force=True, level=logging.DEBUG) for f in du.tmpfilelist: du.rm(path=f, sudo=True, force=True, level=logging.DEBUG) del du.tmpfilelist[:] tmpdir = tempfile.gettempdir() os.chdir(tmpdir) tmppath = os.path.join(tmpdir, 'dejagnutemp%s' % os.getpid()) if du.isdir(path=tmppath): du.rm(path=tmppath, recursive=True, sudo=True, force=True, level=logging.DEBUG) def begin(self): command = sys.argv command[0] = os.path.basename(command[0]) self.logger.info('input command: ' + ' '.join(command)) self.logger.info('param: ' + str(self.param)) self.logger.info('ptl version: ' + str(ptl.__version__)) _m = 'platform: ' + ' '.join(platform.uname()).strip() self.logger.info(_m) self.logger.info('python version: ' + 
str(platform.python_version())) self.logger.info('user: ' + pwd.getpwuid(os.getuid())[0]) self.logger.info('-' * 80) if self.lcov_data is not None: self.lcov_utils = LcovUtils(cov_bin=self.lcov_bin, html_bin=self.genhtml_bin, cov_out=self.lcov_out, data_dir=self.lcov_data, html_nosrc=self.lcov_nosrc, html_baseurl=self.lcov_baseurl) # Initialize coverage analysis self.lcov_utils.zero_coverage() # The following 'dance' is done due to some oddities on lcov's # part, according to this the lcov readme file at # http://ltp.sourceforge.net/coverage/lcov/readme.php that reads: # # Note that this step only works after the application has # been started and stopped at least once. Otherwise lcov will # abort with an error mentioning that there are no data/.gcda # files. self.lcov_utils.initialize_coverage(name='PTLTestCov') PBSInitServices().restart() self._cleanup() def finalize(self, result): if self.lcov_data is not None: # See note above that briefly explains the 'dance' needed to get # reliable coverage data PBSInitServices().restart() self.lcov_utils.capture_coverage(name='PTLTestCov') exclude = ['"*work/gSOAP/*"', '"*/pbs/doc/*"', 'lex.yy.c', 'pbs_ifl_wrap.c', 'usr/include/*', 'unsupported/*'] self.lcov_utils.merge_coverage_traces(name='PTLTestCov', exclude=exclude) self.lcov_utils.generate_html() self.lcov_utils.change_baseurl() self.logger.info('\n'.join(self.lcov_utils.summarize_coverage())) self._cleanup() ================================================ FILE: test/fw/ptl/utils/plugins/ptl_test_tags.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
import sys
import logging
import unittest
from nose.plugins.base import Plugin
import collections
try:
    from collections.abc import Callable  # Python 3.10+
except ImportError:
    from collections import Callable  # For Python versions before 3.10

log = logging.getLogger('nose.plugins.PTLTestTags')

# Attribute name under which the accumulated tag list is stored on a
# decorated class, function or method.
TAGKEY = '__PTL_TAGS_LIST__'


def tags(*args, **kwargs):
    """
    Decorator that adds tags to classes or functions or methods.

    Positional args become boolean tags (set to True on the object);
    keyword args become valued tags stored as ``name=value``.
    """
    def wrap_obj(obj):
        tagobj = getattr(obj, TAGKEY, [])
        for name in args:
            tagobj.append(name)
            PTLTestTags.tags_list.append(name)
            setattr(obj, name, True)
        for name, value in kwargs.items():
            tagobj.append('%s=%s' % (name, value))
            PTLTestTags.tags_list.append(name)
            setattr(obj, name, value)
        setattr(obj, TAGKEY, sorted(set(tagobj)))
        return obj
    return wrap_obj


def get_tag_value(method, cls, tag_name, default=False):
    """
    Look up a tag on a ``method/function``. If the tag isn't found
    there, look it up on the method's class, if any.
    """
    # Sentinel distinguishes "attribute absent" from falsy tag values.
    Missing = object()
    value = getattr(method, tag_name, Missing)
    if value is Missing and cls is not None:
        value = getattr(cls, tag_name, Missing)
    if value is Missing:
        return default
    return value


class EvalHelper(object):

    """
    Object that can act as context dictionary for eval and looks up
    names as attributes on a method/function and its class.
    """

    def __init__(self, method, cls):
        self.method = method
        self.cls = cls

    def __getitem__(self, name):
        return get_tag_value(self.method, self.cls, name)


class FakeRunner(object):

    # Stand-in runner returned when only a tag/test listing was requested;
    # run() prints the listing and exits instead of executing tests.

    def __init__(self, matched, tags_list, list_tags, verbose):
        self.matched = matched
        self.tags_list = tags_list
        self.list_tags = list_tags
        self.verbose = verbose

    def run(self, test):
        if self.list_tags:
            # --list-tags mode: print every known tag name, one per line
            print(('\n'.join(sorted(set(self.tags_list)))))
            sys.exit(0)
        suites = sorted(set(self.matched.keys()))
        if not self.verbose:
            print(('\n'.join(suites)))
        else:
            for k in suites:
                v = sorted(set(self.matched[k]))
                for _v in v:
                    print((k + '.'
                           + _v))
        sys.exit(0)


class PTLTestTags(Plugin):

    """
    Load test cases from given parameter
    """
    name = 'PTLTestTags'
    score = sys.maxsize - 3
    logger = logging.getLogger(__name__)
    # Class-level list of every tag name registered via the @tags decorator.
    tags_list = []

    def __init__(self):
        Plugin.__init__(self)
        self.tags_to_check = []
        self.tags = []
        self.eval_tags = []
        self.tags_info = False
        self.list_tags = False
        self.verbose = False
        self.matched = {}
        self._test_marker = 'test_'

    def options(self, parser, env):
        """
        Register command line options
        """
        pass

    def set_data(self, tags, eval_tags, tags_info=False, list_tags=False,
                 verbose=False):
        self.tags.extend(tags)
        self.eval_tags.extend(eval_tags)
        self.tags_info = tags_info
        self.list_tags = list_tags
        self.verbose = verbose

    def configure(self, options, config):
        """
        Configure the plugin and system, based on selected options.

        attr and eval_attr may each be lists. self.attribs will be a list
        of lists of tuples. In that list, each list is a group of
        attributes, all of which must match for the rule to match.
        """
        self.tags_to_check = []
        for tag in self.eval_tags:
            # eval tags are matched by evaluating the expression with the
            # method/class attributes as the lookup namespace (EvalHelper)
            def eval_in_context(expr, obj, cls):
                return eval(expr, None, EvalHelper(obj, cls))
            self.tags_to_check.append([(tag, eval_in_context)])
        for tags in self.tags:
            tag_group = []
            for tag in tags.strip().split(','):
                if not tag:
                    continue
                items = tag.split('=', 1)
                if len(items) > 1:
                    # "name=value" form
                    key, value = items
                else:
                    # bare "name" means True; negated "!name" means False
                    key = items[0]
                    if key[0] == '!':
                        key = key[1:]
                        value = False
                    else:
                        value = True
                tag_group.append((key, value))
            self.tags_to_check.append(tag_group)
        if (len(self.tags_to_check) > 0) or self.list_tags:
            self.enabled = True

    def is_tags_matching(self, method, cls=None):
        """
        Verify whether a method has the required tags

        The method is considered a match if it matches all tags
        for any tag group.
""" any_matched = False for group in self.tags_to_check: group_matched = True for key, value in group: tag_value = get_tag_value(method, cls, key) if isinstance(value, Callable): if not value(key, method, cls): group_matched = False break elif value is True: if not bool(tag_value): group_matched = False break elif value is False: if bool(tag_value): group_matched = False break elif type(tag_value) in (list, tuple): value = str(value).lower() if value not in [str(x).lower() for x in tag_value]: group_matched = False break else: if ((value != tag_value) and (str(value).lower() != str(tag_value).lower())): group_matched = False break any_matched = any_matched or group_matched if not any_matched: return False def prepareTestRunner(self, runner): """ Prepare test runner """ if (self.tags_info or self.list_tags): return FakeRunner(self.matched, self.tags_list, self.list_tags, self.verbose) def wantClass(self, cls): """ Accept the class if its subclass of TestCase and has at-least one test case """ if not issubclass(cls, unittest.TestCase): return False has_test = False for t in dir(cls): if t.startswith(self._test_marker): has_test = True break if not has_test: return False def wantFunction(self, function): """ Accept the function if its tags match. """ return False def wantMethod(self, method): """ Accept the method if its tags match. """ try: cls = method.__self__.__class__ except AttributeError: return False if not method.__name__.startswith(self._test_marker): return False rv = self.is_tags_matching(method, cls) if rv is None: cname = cls.__name__ if cname not in self.matched.keys(): self.matched[cname] = [] self.matched[cname].append(method.__name__) return rv ================================================ FILE: test/fw/ptl.csh ================================================ #!/usr/bin/csh # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. 
# # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
# This file will set path variables in case of ptl installation

# First try to locate an installed *-ptl package via the distribution's
# package manager (dpkg on Debian-like systems, rpm elsewhere).
if ( -f /etc/debian_version ) then
	set __ptlpkgname=`dpkg -W -f='${binary:Package}\n' | grep -E '*-ptl$'`
	if ( "x${__ptlpkgname}" != "x" ) then
		set ptl_prefix_lib=`dpkg -L ${__ptlpkgname} | grep -m 1 lib$`
	endif
else
	set __ptlpkgname=`rpm -qa | grep -E '*-ptl-[[:digit:]]'`
	if ( "x${__ptlpkgname}" != "x" ) then
		set ptl_prefix_lib=`rpm -ql ${__ptlpkgname} | grep -m 1 lib$`
	endif
endif
if ( $?ptl_prefix_lib ) then
	# Package found: derive bin/ and site-packages paths from its lib dir.
	set python_dir=`/bin/ls -1 ${ptl_prefix_lib}`
	set prefix=`dirname ${ptl_prefix_lib}`
	setenv PATH ${prefix}/bin/:${PATH}
	if ( $?PYTHONPATH ) then
		setenv PYTHONPATH ${prefix}/lib/${python_dir}/site-packages/:$PYTHONPATH
	else
		setenv PYTHONPATH ${prefix}/lib/${python_dir}/site-packages/
	endif
	unset python_dir
	unset prefix
	unset ptl_prefix_lib
else
	# No package: fall back to the PTL tree next to PBS_EXEC from pbs.conf.
	if ( $?PBS_CONF_FILE ) then
		set conf = "$PBS_CONF_FILE"
	else
		set conf = /etc/pbs.conf
	endif
	if ( -r "${conf}" ) then
		# we only need PBS_EXEC from pbs.conf
		set __PBS_EXEC=`grep '^[[:space:]]*PBS_EXEC=' "$conf" | tail -1 | sed 's/^[[:space:]]*PBS_EXEC=\([^[:space:]]*\)[[:space:]]*/\1/'`
		if ( "X${__PBS_EXEC}" != "X" ) then
			# Define PATH and PYTHONPATH for the users
			set PTL_PREFIX=`dirname ${__PBS_EXEC}`/ptl
			set python_dir=`/bin/ls -1 ${PTL_PREFIX}/lib`/site-packages
			if ( $?PATH && -d ${PTL_PREFIX}/bin ) then
				setenv PATH "${PATH}:${PTL_PREFIX}/bin"
			endif
			if ( -d "${PTL_PREFIX}/lib/${python_dir}" ) then
				if ( $?PYTHONPATH ) then
					setenv PYTHONPATH "${PYTHONPATH}:${PTL_PREFIX}/lib/${python_dir}"
				else
					setenv PYTHONPATH "${PTL_PREFIX}/lib/${python_dir}"
				endif
			endif
		endif
	endif
	unset __PBS_EXEC
	unset PTL_PREFIX
	unset conf
	unset python_dir
endif


================================================
FILE: test/fw/ptl.sh
================================================
#!/usr/bin/sh
#
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
# # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
# This file will set path variables in case of ptl installation
# Locate the installed PTL package: Debian-style systems are queried via
# dpkg, all other distros via rpm.  The package name ends in "-ptl".
if [ -f /etc/debian_version ]; then
	__ptlpkgname=$(dpkg -W -f='${binary:Package}\n' 2>/dev/null | grep -E '*-ptl$')
	if [ "x${__ptlpkgname}" != "x" ]; then
		# First entry of the package file list ending in "lib" is the library root
		ptl_prefix_lib=$(dpkg -L ${__ptlpkgname} 2>/dev/null | grep -m 1 lib$ 2>/dev/null)
	fi
else
	__ptlpkgname=$(rpm -qa 2>/dev/null | grep -E '*-ptl-[[:digit:]]')
	if [ "x${__ptlpkgname}" != "x" ]; then
		ptl_prefix_lib=$(rpm -ql ${__ptlpkgname} 2>/dev/null | grep -m 1 lib$ 2>/dev/null)
	fi
fi
# If a native package was found, derive PATH/PYTHONPATH from its install
# prefix; otherwise fall back to the PTL tree next to PBS_EXEC from pbs.conf.
if [ "x${ptl_prefix_lib}" != "x" ]; then
	# The single entry under lib/ is the pythonX.Y directory name
	python_dir=$( /bin/ls -1 ${ptl_prefix_lib} )
	prefix=$( dirname ${ptl_prefix_lib} )
	export PATH=${prefix}/bin/:${PATH}
	# Append existing PYTHONPATH only when it is already set
	export PYTHONPATH=${prefix}/lib/${python_dir}/site-packages${PYTHONPATH:+:$PYTHONPATH}
	unset python_dir
	unset prefix
	unset ptl_prefix_lib
else
	conf="${PBS_CONF_FILE:-/etc/pbs.conf}"
	if [ -r "${conf}" ]; then
		# we only need PBS_EXEC from pbs.conf
		__PBS_EXEC=$( grep '^[[:space:]]*PBS_EXEC=' "$conf" | tail -1 | sed 's/^[[:space:]]*PBS_EXEC=\([^[:space:]]*\)[[:space:]]*/\1/' )
		if [ "X${__PBS_EXEC}" != "X" ]; then
			# Define PATH and PYTHONPATH for the users
			PTL_PREFIX=$( dirname ${__PBS_EXEC} )/ptl
			python_dir=$( /bin/ls -1 ${PTL_PREFIX}/lib )/site-packages
			[ -d "${PTL_PREFIX}/bin" ] && export PATH="${PATH}:${PTL_PREFIX}/bin"
			[ -d "${PTL_PREFIX}/lib/${python_dir}" ] && export PYTHONPATH="${PYTHONPATH:+$PYTHONPATH:}${PTL_PREFIX}/lib/${python_dir}"
			# Also pick up the PBS-bundled python modules when present
			[ -d "${__PBS_EXEC}/lib/python/altair" ] && export PYTHONPATH="${PYTHONPATH:+$PYTHONPATH:}${__PBS_EXEC}/lib/python/altair"
			[ -d "${__PBS_EXEC}/lib64/python/altair" ] && export PYTHONPATH="${PYTHONPATH:+$PYTHONPATH:}${__PBS_EXEC}/lib64/python/altair"
		fi
		# Scrub helper variables so they do not leak into the user's shell
		unset __PBS_EXEC
		unset PTL_PREFIX
		unset conf
		unset python_dir
	fi
fi
================================================ FILE: test/fw/ptlreport ================================================
#!/bin/bash
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.
# Parse a PTL test output log and report per-status counts and details.
prog="`basename $0`"

# Print the command synopsis and option summary.
usage() {
	echo -en "${prog}\n"
	echo -en "\tParses the PTL test output file and reports\n"
	echo -en "\tvarious counts like total, passed, failed, error-ed,\n"
	echo -en "\tskipped and timedout test cases from file.\n\n"
	echo -en "Usage:\n\t${prog} [OPTIONS]\n\n"
	echo -en "OPTIONS:\n"
	echo -en "\t-t | --total\t- Print total number of test cases\n"
	echo -en "\t-p | --passes\t- Print passed test cases\n"
	echo -en "\t-f | --fails\t- Print failed test cases\n"
	echo -en "\t-e | --errors\t- Print error-ed test cases\n"
	echo -en "\t-s | --skipped\t- Print skipped test cases\n"
	echo -en "\t-T | --timedout\t- Print timedout test cases\n"
	echo -en "\t-r | --runtime\t- Print total runtime of tests\n"
	echo -en "\t-S | --summary\t- Print summary of tests\n"
	echo -en "\t-v | --verbose\t- Print verbose output, can be supplied multiple times to increase verbosity\n\n"
}

# args: <enabled:0|1> <count> <status-label>
# Prints the count (or, with -v, the matching test names / tracebacks)
# for one status category.  Reads ${ptl_test_log} and ${verbose} globals.
print_info() {
	if [ ${1} -eq 1 ]
	then
		# Emit a blank separator line between sections after the first one
		[ ${_space} -eq 1 ] && echo " " || _space=1
		if [ ${verbose} -ge 1 ]
		then
			# Nothing in this category: print the zero count and stop
			[ ${2} -le 0 ] && echo "${3^} test(s): ${2}" && return
			# -v (or any verbosity for "skipped"): list the test names
			[ ${verbose} -eq 1 -o "${3}" == "skipped" ] && echo "${2} test(s) ${3}:" && \
				sed -n "/^${3}: \(.*\)$/p" "${ptl_test_log}" | awk '{ $1 = "\t"; print $0 }' && return
			if [ ${verbose} -gt 1 ]
			then
				# -vv: additionally dump the traceback that follows each entry.
				# Spaces in names are temporarily mapped to '@' so the shell
				# for-loop iterates one record at a time.
				lines=`sed -n "/^${3}: \(.*\)$/p" "${ptl_test_log}" | awk '{ $1 = ""; gsub(/ /, "@", $0); print $0 }'`
				for line in ${lines}
				do
					line=${3^^}":"`echo ${line} | tr '@' ' '`
					echo ${line}
					sed -n "/${line}/,\${N;/^\n$/{P;q};P;D}" "${ptl_test_log}" | \
						awk 'NR > 3 { sub(/.*Traceback/, "Traceback", $0); print " "$0}'
				done
			fi
		else
			# Non-verbose: bare count only
			echo ${2}
		fi
	fi
}

# Need at least the log file and one option
if [ $# -le 1 ]
then
	usage
	exit 1
fi

ptl_test_log=$1
if [ ! -r "${ptl_test_log}" ]
then
	# BUGFIX: error message read "does't"
	echo "${prog}: ${ptl_test_log} doesn't exist or doesn't have read permission!"
	exit 1
fi

# Option flags (0 = off, 1 = requested); verbose counts -v occurrences
total=0
passes=0
fails=0
errors=0
skipped=0
timedout=0
summary=0
verbose=0
runtime=0
_space=0

shift
while [ "$1" != "" ]; do
	case $1 in
		-p | --passes) passes=1; shift;;
		-f | --fails) fails=1; shift;;
		-e | --errors) errors=1; shift;;
		-s | --skipped) skipped=1; shift ;;
		-T | --timedout) timedout=1; shift;;
		-v | --verbose) verbose=$((${verbose} + 1)); shift ;;
		-t | --total) total=1; shift;;
		-S | --summary) summary=1; shift;;
		-r | --runtime) runtime=1; shift;;
		-h | --help ) usage; exit 0;;
		* ) echo -en "Unknown Option: $1\n\n"; usage; exit 1;;
	esac
done

# The summary line looks like "run: N, failures: N, errors: N, ..."; pull
# out every second comma/colon-separated field to get the six counts.
summary_line=`sed -n '/^run:.*: [0-9]*$/p' "${ptl_test_log}"`
read total_ct pass_ct fail_ct err_ct skip_ct timedout_ct <<< \
	`echo ${summary_line} | awk -F '[,:]' \
	'ORS=" " { for (i=2; i<=NF; i=i+2) { gsub(/^[ \t]+/, "", $i); print $i } }'`

if [ ${total} -eq 1 ]
then
	[ ${_space} -eq 1 ] && echo " " || _space=1
	[ ${verbose} -ge 1 ] && echo "Total test(s): ${total_ct}" || echo ${total_ct}
fi
if [ ${passes} -eq 1 ]
then
	[ ${_space} -eq 1 ] && echo " " || _space=1
	[ ${verbose} -ge 1 ] && echo "Passed test(s): ${pass_ct}" || echo ${pass_ct}
fi
print_info ${fails} ${fail_ct} "failed"
print_info ${errors} ${err_ct} "error"
print_info ${skipped} ${skip_ct} "skipped"
print_info ${timedout} ${timedout_ct} "timedout"
if [ ${summary} -eq 1 ]
then
	[ ${_space} -eq 1 ] && echo " " || _space=1
	[ ${verbose} -ge 1 ] && echo -en "Summary: \n\t "
	echo ${summary_line}
fi
if [ ${runtime} -eq 1 ]
then
	# "Tests run in HH:MM:SS.ms" -> keep everything before the fraction
	test_run_output=`sed -n '/^Tests run in [\.:0-9]*$/p' "${ptl_test_log}" | awk -F. '{print $1}'`
	[ ${_space} -eq 1 ] && echo " " || _space=1
	[ ${verbose} -ge 1 ] && echo ${test_run_output} || echo ${test_run_output} | awk '{ print $NF }'
fi
exit 0
================================================ FILE: test/fw/requirements.txt ================================================
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
# # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. nose beautifulsoup4 pexpect defusedxml ================================================ FILE: test/fw/setup.py.in ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
from setuptools import setup, find_packages import os os.chdir(os.path.dirname(os.path.abspath(os.path.abspath(__file__)))) def get_reqs(): install_requires = open('requirements.txt').readlines() return [r.strip() for r in install_requires] def get_scripts(): return ['bin/%s' % (x) for x in os.listdir('bin')] setup( name='PbsTestLab', version='@PBS_VERSION@', packages=find_packages(), scripts=get_scripts(), include_package_data=True, license='AGPLv3 with exceptions', description='PBS Testing and Benchmarking Framework', long_description=open(os.path.abspath('./doc/intro.rst')).read(), install_requires=get_reqs(), keywords='PbsTestLab ptl pbs', zip_safe=False, classifiers=[ 'Development Status :: 5 - Production/Stable', 'Environment :: Other Environment', 'Intended Audience :: Developers', 'License :: AGPLv3 with exceptions', 'Operating System :: POSIX :: Linux', 'Programming Language :: Python :: 3.6', 'Topic :: Software Development :: Testing', 'Topic :: Software Development :: Quality Assurance', ] ) ================================================ FILE: test/scripts/qsub_multi.sh ================================================ #!/bin/bash # Used to achieve faster job submission of large number of jobs for performance testing if [ $# -lt 2 ]; then echo "syntax: $0 " exit 1 fi function submit_jobs { njobs=$1 echo "New thread submitting jobs=$njobs" for i in $(seq 1 $njobs) do qsub -- /bin/date > /dev/null done } if [ "$1" = "submit" ]; then njobs=$2 submit_jobs $njobs exit 0 fi nthreads=$1 njobs=$2 echo "parameters supplied: nthreads=$nthreads, njobs=$njobs" start_time=`date +%s%3N` for i in $(seq 1 $nthreads) do setsid $0 submit $njobs & done wait end_time=`date +%s%3N` diff=`bc -l <<< "scale=3; ($end_time - $start_time) / 1000"` total_jobs=`bc -l <<< "$njobs * $nthreads"` perf=`bc -l <<< "scale=3; $total_jobs / $diff"` echo "Time(ms) started=$start_time, ended=$end_time" echo "Total jobs submitted=$total_jobs, time taken(secs.ms)=$diff, jobs/sec=$perf" 
================================================ FILE: test/tests/Makefile.am ================================================ # # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
#
if ENABLEPTL
# Install destination for all PTL test suites shipped with the build
ptl_testsdir = ${ptl_prefix}/tests
# Top-level test modules are installed as _PYTHON (byte-compiled on install)
dist_ptl_tests_PYTHON = $(wildcard $(srcdir)/*.py)
# One <category>dir / _DATA pair per test category; files installed verbatim
ptl_testfunctionaldir = $(ptl_testsdir)/functional
dist_ptl_testfunctional_DATA = $(wildcard $(srcdir)/functional/*.py)
ptl_testinterfacesdir = $(ptl_testsdir)/interfaces
dist_ptl_testinterfaces_DATA = $(wildcard $(srcdir)/interfaces/*.py)
ptl_testperformancedir = $(ptl_testsdir)/performance
dist_ptl_testperformance_DATA = $(wildcard $(srcdir)/performance/*.py)
ptl_testresiliencedir = $(ptl_testsdir)/resilience
dist_ptl_testresilience_DATA = $(wildcard $(srcdir)/resilience/*.py)
ptl_testsecuritydir = $(ptl_testsdir)/security
dist_ptl_testsecurity_DATA = $(wildcard $(srcdir)/security/*.py)
ptl_testselftestdir = $(ptl_testsdir)/selftest
dist_ptl_testselftest_DATA = $(wildcard $(srcdir)/selftest/*.py)
ptl_testupgradesdir = $(ptl_testsdir)/upgrades
dist_ptl_testupgrades_DATA = $(wildcard $(srcdir)/upgrades/*.py)
endif
================================================ FILE: test/tests/__init__.py ================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
# # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. ================================================ FILE: test/tests/functional/__init__.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. 
For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from ptl.utils.pbs_testsuite import * class TestFunctional(PBSTestSuite): """ Base test suite for Functional tests """ pass ================================================ FILE: test/tests/functional/pbs_Rrecord_resources_used.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. 
For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * import re @requirements(num_moms=2) class Test_Rrecord_with_resources_used(TestFunctional): """ This test suite tests whether the 'R' record in accounting logs has information on resources_used in the following scenarios. a) The node the job was running on goes down and node_fail_requeue timeout is hit. b) It is rerun using qrerun . c) It is rerun using qrerun -Wforce . 
d) mom is restarted without any options or with the '-r' option """ def setUp(self): TestFunctional.setUp(self) if len(self.moms) != 2: self.skipTest('test requires two MoMs as input, ' + 'use -p moms=:') self.server.set_op_mode(PTL_CLI) # PBSTestSuite returns the moms passed in as parameters as dictionary # of hostname and MoM object self.momA = self.moms.values()[0] self.momB = self.moms.values()[1] self.hostA = self.momA.shortname self.hostB = self.momB.shortname a = {'resources_available.ncpus': 4} self.server.manager(MGR_CMD_SET, NODE, a, id=self.hostA) self.server.manager(MGR_CMD_SET, NODE, a, id=self.hostB) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) def common(self, is_nonrerunnable, restart_mom): # Set node_fail_requeue=5 on server a = {ATTR_nodefailrq: 5} self.server.manager(MGR_CMD_SET, SERVER, a) # Job script test = [] test += ['#PBS -N RequeueTest\n'] test += ['#PBS -l ncpus=1\n'] test += ['echo Starting test at `date`\n'] test += ['sleep 1000\n'] test1 = [] test1 += ['#PBS -N RequeueTest\n'] test1 += ['#PBS -lselect=1:ncpus=1 -l place=scatter\n'] test1 += ['echo Starting test at `date`\n'] test1 += ['sleep 1000\n'] # Submit three jobs J1,J2,J3[] j1 = Job(TEST_USER, attrs={ATTR_k: 'oe'}) j1.create_script(body=test) jid1 = self.server.submit(j1) if is_nonrerunnable is True: j2 = Job(TEST_USER, attrs={ATTR_r: 'n', ATTR_k: 'oe'}) else: j2 = Job(TEST_USER, attrs={ATTR_r: 'y', ATTR_k: 'oe'}) j2.create_script(body=test1) jid2 = self.server.submit(j2) j3 = Job(TEST_USER, attrs={ATTR_J: '1-6', ATTR_k: 'oe'}) j3.create_script(body=test) jid3 = self.server.submit(j3) subjobs = self.server.status(JOB, id=jid3, extend='t') jid3s1 = subjobs[1]['id'] # Wait for the jobs to start running. self.server.expect(JOB, {ATTR_substate: '42'}, jid1) self.server.expect(JOB, {ATTR_substate: '42'}, jid2) self.server.expect(JOB, {ATTR_substate: '42'}, jid3s1) # Verify that accounting logs have Resource_List. 
value self.server.accounting_match( msg='.*Resource_List.*', id=jid1, regexp=True) self.server.accounting_match( msg='.*Resource_List.*', id=jid2, regexp=True) self.server.accounting_match( msg='.*Resource_List.*', id=jid3s1, regexp=True) # Bring both moms down using kill -9 self.momA.signal('-KILL') self.momB.signal('-KILL') # Verify that both nodes are reported to be down. self.server.expect(NODE, {ATTR_NODE_state: ( MATCH_RE, '.*down.*')}, id=self.hostA) self.server.expect(NODE, {ATTR_NODE_state: ( MATCH_RE, '.*down.*')}, id=self.hostB) self.server.expect(JOB, {ATTR_state: 'Q'}, jid1) self.server.expect(JOB, {ATTR_state: 'Q'}, jid3s1) if is_nonrerunnable is False: # All rerunnable jobs - all should be in 'Q' state. self.server.expect(JOB, {ATTR_state: 'Q'}, jid2) else: # Job2 is non-rerunnable. self.server.expect(JOB, {ATTR_state: 'F'}, jid2, extend='x') # tracejob should show "Job requeued, execution node down" self.server.tracejob_match( msg='Job requeued, execution node .* down', id=jid1, regexp=True) if is_nonrerunnable is False: e = True else: e = False msg = 'Job requeued, execution node .* down' self.server.tracejob_match(msg=msg, id=jid2, regexp=True, existence=e) self.server.tracejob_match( msg='Job requeued, execution node .* down', id=jid3s1, regexp=True) self.server.accounting_match( msg='.*Resource_List.*', id=jid1, regexp=True) self.server.accounting_match( msg='.*Resource_List.*', id=jid2, regexp=True) self.server.accounting_match( msg='.*Resource_List.*', id=jid3s1, regexp=True) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) if restart_mom == 's': # Start mom without any option self.momA.start() self.momB.start() elif restart_mom == 'r': # Start mom with -r option self.momA.start(args=['-r']) self.momB.start(args=['-r']) return jid1, jid2, jid3s1 def test_Rrecord_with_nodefailrequeue(self): """ Scenario: The node on which the job was running goes down and node_fail_requeue time-out is hit. 
Expected outcome: Server should record last known resource usage in the 'R' record. """ jid1, jid2, jid3s1 = self.common(False, False) self.server.accounting_match( msg='.*R;' + jid1 + '.*resources_used.*', id=jid1, regexp=True) self.server.accounting_match( msg='.*R;' + jid2 + '.*resources_used.*', id=jid2, regexp=True) self.server.accounting_match( msg='.*R;' + re.escape(jid3s1) + '.*resources_used.*', id=jid3s1, regexp=True) def test_Rrecord_when_mom_restarted_with_r(self): """ Scenario: The node on which the job was running goes down and node_fail_requeue time-out is hit and mom is restarted with '-r' Expected outcome: Server should record last known resource usage in the 'R' record. """ jid1, jid2, jid3s1 = self.common(False, 'r') self.server.accounting_match( msg='.*R;' + jid1 + '.*resources_used.*run_count=1', id=jid1, regexp=True) self.server.accounting_match( msg='.*R;' + jid2 + '.*resources_used.*run_count=1', id=jid2, regexp=True) self.server.accounting_match( msg='.*R;' + re.escape(jid3s1) + '.*resources_used.*run_count=1', id=jid3s1, regexp=True) def test_Rrecord_for_nonrerunnable_jobs(self): """ Scenario: One non-rerunnable job. The node on which the job was running goes down and node_fail_requeue time-out is hit. Expected outcome: Server should record last known resource usage in the 'R' record only for rerunnable jobs. """ a = {ATTR_JobHistoryEnable: 1} self.server.manager(MGR_CMD_SET, SERVER, a) jid1, jid2, jid3s1 = self.common(True, 'r') self.server.accounting_match( msg='.*R;' + jid1 + '.*resources_used.*run_count=1', id=jid1, regexp=True) self.server.accounting_match( msg='.*R;' + jid2 + '.*resources_used.*run_count=1', id=jid2, regexp=True, existence=False, max_attempts=5) self.server.accounting_match( msg='.*R;' + re.escape(jid3s1) + '.*resources_used.*run_count=1', id=jid3s1, regexp=True) def test_Rrecord_when_mom_restarted_without_r(self): """ Scenario: Mom restarted without '-r' option and jobs are requeued using qrerun. 
Expected outcome: Server should record last known resource usage in the 'R' record for both. """ jid1, jid2, jid3s1 = self.common(False, 's') self.server.accounting_match( msg='.*R;' + jid1 + '.*resources_used.*run_count=1', id=jid1, regexp=True) self.server.accounting_match( msg='.*R;' + jid2 + '.*resources_used.*run_count=1', id=jid2, regexp=True) self.server.accounting_match( msg='.*R;' + re.escape(jid3s1) + '.*resources_used.*run_count=1', id=jid3s1, regexp=True) # Verify that the jobs are in 'Q' state. self.server.expect(JOB, {ATTR_state: 'Q'}, jid1) self.server.expect(JOB, {ATTR_state: 'Q'}, jid2) self.server.expect(JOB, {ATTR_state: 'Q'}, jid3s1) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) self.server.expect(JOB, {ATTR_substate: '42'}, jid1) self.server.expect(JOB, {ATTR_substate: '42'}, jid2) self.server.expect(JOB, {ATTR_substate: '42'}, jid3s1) # qrerun the jobs and wait for them to start running. self.server.rerunjob(jobid=jid1) self.server.rerunjob(jobid=jid2) self.server.rerunjob(jobid=jid3s1) # Confirm that the 'R' record is generated and the run_count is 2. self.server.accounting_match( msg='.*R;' + jid1 + '.*resources_used.*run_count=2', id=jid1, regexp=True) self.server.accounting_match( msg='.*R;' + jid2 + '.*resources_used.*run_count=2', id=jid2, regexp=True) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) def test_Rrecord_with_multiple_reruns(self): """ Scenario: Job is rerun multiple times. Expected outcome: Server should record last known resource usage every time the job is rerun. """ dflt_q = self.server.default_queue # As user submit three jobs. 
        # (continuation of the R-record rerun test started above)
        # Build a rerunnable sleep job script shared by J1/J2/J3.
        test = []
        test += ['#PBS -N RequeueTest\n']
        test += ['#PBS -l ncpus=1\n']
        test += ['echo Starting test at `date`\n']
        test += ['sleep 1000\n']
        j1 = Job(TEST_USER)
        j1.create_script(body=test)
        j1.set_attributes({ATTR_r: 'y', ATTR_l + '.ncpus': 2})
        jid1 = self.server.submit(j1)
        j2 = Job(TEST_USER)
        j2.create_script(body=test)
        j2.set_attributes({ATTR_r: 'n', ATTR_l + '.ncpus': 2})
        jid2 = self.server.submit(j2)
        j3 = Job(TEST_USER)
        j3.create_script(body=test)
        j3.set_attributes({ATTR_J: '1-4', ATTR_k: 'oe'})
        jid3 = self.server.submit(j3)
        subjobs = self.server.status(JOB, id=jid3, extend='t')
        # subjobs[0] is the parent array job; [1] is the first subjob
        jid3s1 = subjobs[1]['id']
        # Verify that the jobs have started running.
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid1)
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid2)
        self.server.expect(JOB, {ATTR_state: 'B'}, jid3)
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid3s1)
        # Verify that the accounting logs have Resource_List. but no
        # R records.
        # NOTE(review): jid1/jid2 are embedded unescaped in these regex
        # patterns, so the '.' in the job id matches any character; harmless
        # here, but re.escape() (as used for jid3s1) would be stricter.
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid1, regexp=True)
        msg = '.*R;' + jid1 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid1, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid2, regexp=True)
        msg = '.*R;' + jid2 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid2, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid3s1, regexp=True)
        self.server.accounting_match(msg='.*R;' + re.escape(jid3s1) +
                                     '.*resources_used.*', id=jid3s1,
                                     regexp=True, existence=False)
        # sleep for 5 seconds so the jobs use some resources.
        time.sleep(5)
        self.server.rerunjob(jid1)
        self.server.rerunjob(jid3s1)
        # Verify that the accounting logs have R logs with last known resource
        # usage. No R logs for J2.
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid1, regexp=True)
        msg = '.*R;' + jid2 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid2, regexp=True,
                                     existence=False)
        self.server.accounting_match(msg='.*R;' + re.escape(
            jid3s1) + '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid3s1, regexp=True)
        # sleep for 5 seconds so the jobs use some resources.
        time.sleep(5)
        self.server.rerunjob(jid1)
        self.server.rerunjob(jid3s1)
        # Verify that the accounting logs show R records with last known
        # resource usage; run_count should be 2 for J1 (second rerun) and
        # remain 1 in the matched record for the subjob.
        # No R logs in accounting for J2.
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=2.*',
            id=jid1, regexp=True)
        msg = '.*R;' + jid2 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid2, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*R;' + re.escape(jid3s1) +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid3s1, regexp=True)

    def test_Rrecord_with_multiple_reruns_case2(self):
        """
        Scenario: Jobs submitted with select cput and ncpus.
        Job is rerun multiple times.
        Expected outcome: Server should record last known resource
        usage that has cputime.
        """
        dflt_q = self.server.default_queue
        # Busy-loop shell script so the job accumulates cput.
        script = []
        script += ['i=0;\n']
        script += ['while [ $i -ne 0 ] || sleep 0.125;\n']
        script += ['do i=$(((i+1) % 10000 ));\n']
        script += ['done\n']
        j1 = Job(TEST_USER)
        j1.create_script(body=script)
        j1.set_attributes(
            {ATTR_l + '.cput': 160, ATTR_l + '.ncpus': 3, ATTR_k: 'oe'})
        jid1 = self.server.submit(j1)
        j2 = Job(TEST_USER)
        j2.create_script(body=script)
        j2.set_attributes(
            {ATTR_l + '.cput': 180, ATTR_l + '.ncpus': 3, ATTR_k: 'oe'})
        jid2 = self.server.submit(j2)
        # Verify that the jobs have started running.
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid1)
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid2)
        # Verify that the accounting logs have Resource_List. but no
        # R records.
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid1, regexp=True)
        msg = '.*R;' + jid1 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid1, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid2, regexp=True)
        msg = '.*R;' + jid2 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid2, regexp=True,
                                     existence=False)
        time.sleep(5)
        jids = self.server.select()
        self.server.rerunjob(jids)
        # Verify that the accounting logs have an R record with last known
        # resource usage; run_count in this first R record is 1 for J1/J2
        # (run_count=2 is checked after the second rerun below).
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*.*resources_used.cput=[0-9]*:[0-9]*:[0-9]*.*.*run_count=1.*',
            id=jid1, regexp=True)
        self.server.accounting_match(
            msg='.*R;' + jid2 +
            '.*.*resources_used.cput=[0-9]*:[0-9]*:[0-9]*.*.*run_count=1.*',
            id=jid2, regexp=True)
        time.sleep(5)
        jids = self.server.select()
        self.server.rerunjob(jids)
        # After the second rerun, an R record with run_count=2 must exist.
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*.*resources_used.cput=[0-9]*:[0-9]*:[0-9]*.*.*run_count=2.*',
            id=jid1, regexp=True)
        self.server.accounting_match(
            msg='.*R;' + jid2 +
            '.*.*resources_used.cput=[0-9]*:[0-9]*:[0-9]*.*.*run_count=2.*',
            id=jid2, regexp=True)

    def test_Rrecord_job_rerun_forcefully(self):
        """
        Scenario: Job is forcefully rerun.
        Expected outcome: server should record last known resource usage
        in the R record.
        """
        dflt_q = self.server.default_queue
        # Rerunnable sleep job script shared by J1/J2/J3.
        test = []
        test += ['#PBS -N RequeueTest\n']
        test += ['#PBS -l ncpus=1\n']
        test += ['echo Starting test at `date`\n']
        test += ['sleep 1000\n']
        j1 = Job(TEST_USER)
        j1.create_script(body=test)
        j1.set_attributes({ATTR_r: 'y', ATTR_l + '.ncpus': 2})
        jid1 = self.server.submit(j1)
        j2 = Job(TEST_USER)
        j2.create_script(body=test)
        j2.set_attributes({ATTR_r: 'n', ATTR_l + '.ncpus': 2})
        jid2 = self.server.submit(j2)
        j3 = Job(TEST_USER)
        j3.create_script(body=test)
        j3.set_attributes({ATTR_J: '1-4', ATTR_k: 'oe'})
        jid3 = self.server.submit(j3)
        subjobs = self.server.status(JOB, id=jid3, extend='t')
        jid3s1 = subjobs[1]['id']
        # Verify that the jobs have started running.
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid1)
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid2)
        self.server.expect(JOB, {ATTR_state: 'B'}, jid3)
        self.server.expect(JOB, {ATTR_substate: '42', 'run_count': 1}, jid3s1)
        # Verify that the accounting logs have Resource_List. but no
        # R records.
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid1, regexp=True)
        msg = '.*R;' + jid1 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid1, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid2, regexp=True)
        msg = '.*R;' + jid2 + '.*resources_used.*'
        self.server.accounting_match(msg=msg, id=jid2, regexp=True,
                                     existence=False)
        self.server.accounting_match(
            msg='.*Resource_List.*', id=jid3s1, regexp=True)
        self.server.accounting_match(msg='.*R;' + re.escape(jid3s1) +
                                     '.*resources_used.*', id=jid3s1,
                                     regexp=True, existence=False)
        time.sleep(5)
        # 'T' also selects subjobs; rerun everything with force.
        jids = self.server.select(extend='T')
        self.server.rerunjob(jids, extend='force')
        # Verify that the accounting logs have R record with last known
        # resource usage and run_count should be 1 for J1 and J2
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid1, regexp=True)
        self.server.accounting_match(
            msg='.*R;' + jid2 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid2, regexp=True)
        self.server.accounting_match(msg='.*R;' + re.escape(
            jid3s1) + '.*Exit_status=-11.*.*resources_used.*.*run_count=1.*',
            id=jid3s1, regexp=True)
        time.sleep(5)
        jids = self.server.select(extend='T')
        self.server.rerunjob(jids, extend='force')
        # Verify that the accounting logs have R record with last known
        # usage and run_count should be 2 for J1 and J2.
        self.server.accounting_match(
            msg='.*R;' + jid1 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=2.*',
            id=jid1, regexp=True)
        self.server.accounting_match(
            msg='.*R;' + jid2 +
            '.*Exit_status=-11.*.*resources_used.*.*run_count=2.*',
            id=jid2, regexp=True)
        self.server.accounting_match(msg='.*R;' + re.escape(
            jid3s1) + '.*Exit_status=-11.*.*resources_used.*.*run_count=2.*',
            id=jid3s1, regexp=True)

    def tearDown(self):
        TestFunctional.tearDown(self)


================================================
FILE: test/tests/functional/pbs_acct_log.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.


from tests.functional import *


class TestAcctLog(TestFunctional):
    """
    Tests dealing with the PBS accounting logs
    """

    def setUp(self):
        TestFunctional.setUp(self)
        # Host-level custom string resource used by the truncation tests.
        a = {'type': 'string', 'flag': 'h'}
        self.server.manager(MGR_CMD_CREATE, RSC, a, id='foo_str')

    def test_long_resource_end(self):
        """
        Test to see if a very long string resource is neither truncated
        in the job's resources_used attr or the accounting log at job end
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'job_history_enable': 'True'})
        # Create a very long string - the truncation was 2048 characters
        # 4096 is plenty big to show it
        hstr = '1'*4096
        hook_body = "import pbs\n"
        hook_body += "e = pbs.event()\n"
        hook_body += "hstr=\'" + hstr + "\'\n"
        hook_body += "e.job.resources_used[\"foo_str\"] = hstr\n"
        a = {'event': 'execjob_epilogue', 'enabled': 'True'}
        self.server.create_import_hook("ep", a, hook_body)
        J = Job()
        J.set_sleep_time(1)
        jid = self.server.submit(J)
        # Make sure the resources_used value hasn't been truncated
        self.server.expect(JOB, {'job_state': 'F'}, id=jid, extend='x')
        self.server.expect(
            JOB, {'resources_used.foo_str': hstr}, extend='x',
            max_attempts=1)
        # Make sure the accounting log hasn't been truncated
        log_match = 'resources_used.foo_str=' + hstr
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, log_match), regexp=True)
        # Make sure the server log hasn't been truncated
        log_match = 'resources_used.foo_str=' + hstr
        self.server.log_match("%s;.*%s.*" % (jid, log_match), regexp=True)

    def test_long_resource_reque(self):
        """
        Test to see if a very long string value is truncated in the 'R'
        requeue accounting record
        """
        # Create a very long string - the truncation was 2048 characters
        # 4096 is plenty big to show it
        hstr = ""
        for i in range(4096):
            hstr += "1"
        hook_body = "import pbs\n"
        hook_body += "e = pbs.event()\n"
        hook_body += "hstr=\'" + hstr + "\'\n"
        hook_body += "e.job.resources_used[\"foo_str\"] = hstr\n"
        a = {'event': 'execjob_prologue', 'enabled': 'True'}
        self.server.create_import_hook("pr", a, hook_body)
        J = Job()
        jid = self.server.submit(J)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        self.server.rerunjob(jid)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid)
        # Make sure the accounting log hasn't been truncated
        acctlog_match = 'resources_used.foo_str=' + hstr
        self.server.accounting_match(
            "R;%s;.*%s.*" % (jid, acctlog_match), regexp=True)

    def test_queue_record(self):
        """
        Test the correct data is being printed in the queue record
        """
        # NOTE(review): 't' is assigned but never used in this test.
        t = time.time()
        a = {ATTR_g: TEST_USER.groups[0], ATTR_project: 'foo',
             ATTR_A: 'bar', ATTR_N: 'baz', ATTR_l + '.walltime': '1:00:00'}
        j1 = Job(TEST_USER, a)
        jid1 = self.server.submit(j1)
        (_, line) = self.server.accounting_match(';Q;' + jid1)
        # Check for euser
        self.assertIn('user=' + str(TEST_USER), line)
        # Check for egroup
        self.assertIn('group=' + str(TEST_USER.groups[0]), line)
        # Check for project
        self.assertIn('project=foo', line)
        # Check for account name
        self.assertIn('account=\"bar\"', line)
        # Check for job name
        self.assertIn('jobname=baz', line)
        # Check for queue
        self.assertIn('queue=workq', line)
        # Check for the existence of times
        self.assertIn('etime=', line)
        self.assertIn('ctime=', line)
        self.assertIn('qtime=', line)
        self.assertNotIn('start=', line)
        # Check for walltime
        self.assertIn('Resource_List.walltime=01:00:00', line)
        j2 = Job(TEST_USER, {ATTR_J: '1-2', ATTR_depend: 'afterok:' + jid1})
        jid2 = self.server.submit(j2)
        (_, line) = self.server.accounting_match(';Q;' + jid2)
        self.assertIn('array_indices=1-2', line)
        self.assertIn('depend=afterok:' + jid1, line)
        r = Reservation()
        rid1 = self.server.submit(r)
        a = {'reserve_state': (MATCH_RE, "RESV_CONFIRMED|2")}
        self.server.expect(RESV, a, id=rid1)
        j3 = Job(TEST_USER, {ATTR_queue: rid1.split('.')[0]})
        jid3 = self.server.submit(j3)
        (_, line) = self.server.accounting_match(';Q;' + jid3)
        self.assertIn('resvID=' + rid1, line)

    def test_queue_record_hook(self):
        """
        Test that changes made in a queuejob hook are reflected in the
        Q record
        """
        qj_hook = """
import pbs
pbs.event().job.project = 'foo'
pbs.event().accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        self.server.create_import_hook('qj', qj_attrs, qj_hook)
        j = Job()
        jid1 = self.server.submit(j)
        (_, line) = self.server.accounting_match(';Q;' + jid1)
        self.assertIn('project=foo', line)

    def test_alter_record(self):
        """
        Test the accounting log alter record
        """
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job(TEST_USER1)
        jid1 = self.server.submit(j1)
        # Basic test for existence of record for Resource_List
        self.server.alterjob(jid1, {ATTR_l + '.walltime': '1:00:00'})
        self.server.accounting_match(';a;' + jid1 +
                                     ';Resource_List.walltime=01:00:00')
        # Check for default value when unsetting
        self.server.manager(MGR_CMD_SET, SERVER,
                            {ATTR_rescdflt + '.walltime': '30:00'})
        self.server.alterjob(jid1, {ATTR_l + '.walltime': ''})
        self.server.accounting_match(';a;' + jid1 +
                                     ';Resource_List.walltime=00:30:00')
        self.server.alterjob(jid1, {ATTR_l + '.software': 'foo'})
        self.server.accounting_match(';a;' + jid1 +
                                     ';Resource_List.software=foo')
        # Check for UNSET record when value is unset
        self.server.alterjob(jid1, {ATTR_l + '.software': '\"\"'})
        self.server.accounting_match(';a;' + jid1 +
                                     ';Resource_List.software=UNSET')
        # Check for non-resource attribute
        self.server.alterjob(jid1, {ATTR_p: 150})
        self.server.accounting_match(';a;' + jid1 + ';Priority=150')
        self.server.alterjob(jid1, {ATTR_g: str(TSTGRP1)})
        self.server.accounting_match(';a;' + jid1 +
                                     ';group_list=' + str(TSTGRP1))
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'})
        # Check that scheduler's alters are not logged
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.accounting_match(
            ';a;' + jid1 + ';comment', existence=False, max_attempts=2)

    def test_alter_record_hooks(self):
        """
        Test that when hooks set attributes, an 'a' record is logged
        """
        mj_hook = """
import pbs
pbs.event().job.comment = 'foo'
pbs.event().accept()
"""
        mj_attrs = {'event': 'modifyjob', 'enabled': 'True'}
        rj_hook = """
import pbs
pbs.event().job.project = 'abc'
pbs.event().reject('foo')
"""
        rj_attrs = {'event': 'runjob', 'enabled': 'True'}
        self.server.create_import_hook('mj', mj_attrs, mj_hook)
        self.server.create_import_hook('rj', rj_attrs, rj_hook)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job()
        jid1 = self.server.submit(j1)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';')
        self.assertIn('Priority=150', line)
        self.assertIn('comment=foo', line)
        try:
            self.server.runjob(jid1)
        except PbsRunError:
            # runjob hook is rejecting the run request
            pass
        self.server.accounting_match(';a;' + jid1 + ';project=abc')

    def test_alter_record_queuejob_hook(self):
        """
        Test that when a queuejob hook set an attribute, an 'a' record is
        logged.
        """
        qj_hook = """
import pbs
e1 = pbs.event()
e1.job.project = 'abc'
e2 = pbs.event()
e2.accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        self.server.create_import_hook('qj', qj_attrs, qj_hook)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job(TEST_USER, {'Resource_List.walltime': 42})
        j1.set_sleep_time(1)
        jid1 = self.server.submit(j1)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';')
        self.assertIn('Priority=150', line)
        (_, line) = self.server.accounting_match(';Q;' + jid1 + ';')
        self.assertIn('project=abc', line)
        self.server.runjob(jid1)
        (_, line) = self.server.accounting_match(';E;' + jid1 + ';')
        self.assertIn('project=abc', line)

    def test_alter_record_modifyjob_hook(self):
        """
        Test that when a modifyjob hook set attributes, an 'a' record is
        logged.
        """
        mj_hook = """
import pbs
e1 = pbs.event()
e1.job.comment = 'foo'
e1.job.project = 'abc'
e2 = pbs.event()
e2.accept()
"""
        mj_attrs = {'event': 'modifyjob', 'enabled': 'True'}
        self.server.create_import_hook('mj', mj_attrs, mj_hook)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job(TEST_USER, {'Resource_List.walltime': 42})
        j1.set_sleep_time(1)
        jid1 = self.server.submit(j1)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';')
        self.assertIn('Priority=150', line)
        self.assertIn('comment=foo', line)
        self.assertIn('project=abc', line)
        self.server.runjob(jid1)
        (_, line) = self.server.accounting_match(';E;' + jid1 + ';')
        # self.assertIn('comment=foo', line)  # Doesn't exist in E
        self.assertIn('project=abc', line)

    def test_alter_record_runjob_hook(self):
        """
        Test that when a runjob hook set attributes, an 'a' record is
        logged.
        """
        # Diagnostic hook: logs the event/job identities, changes nothing.
        info_hook = """
import pbs
e1 = pbs.event()
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOK:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" comment:{e1.job.comment}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        mj_attrs = {'event': 'modifyjob', 'enabled': 'True'}
        self.server.create_import_hook('qj', qj_attrs, info_hook)
        self.server.create_import_hook('mj', mj_attrs, info_hook)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job(TEST_USER, {'Resource_List.walltime': 42})
        j1.set_sleep_time(1)
        jid1 = self.server.submit(j1)
        self.server.alterjob(jid1, {ATTR_p: 150})
        # The runjob hook is created after submit so the job id can be
        # interpolated into the hook script.
        rj_hook = """
import pbs
e1 = pbs.event()
e1.job.Output_Path = '/tmp/job-%s-output'
e1.job.Error_Path = '/tmp/job-%s-error'
e2 = pbs.event()
e2.accept()
""" % (jid1, jid1)
        rj_attrs = {'event': 'runjob', 'enabled': 'True'}
        self.server.create_import_hook('rj', rj_attrs, rj_hook)
        self.server.runjob(jid1)
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';')
        self.assertIn('Priority=150', line)
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';Output_Path')
        self.assertIn('Output_Path=/tmp/job-%s-output' % jid1, line)
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';Error_Path')
        self.assertIn('Error_Path=/tmp/job-%s-error' % jid1, line)

    def test_multiple_alter_record_hooks(self):
        """
        Test that when hooks set attributes, an 'a' record is logged.
        """
        mj_hook_00 = """
import pbs
e1 = pbs.event()
e1.job.comment = 'foo'
e1.job.project = "aaa"
e2 = pbs.event()
e2.accept()
"""
        mj_hook_01 = """
import pbs
e1 = pbs.event()
e1.job.comment = 'foo2'
e1.job.project = "bbb"
e2 = pbs.event()
e2.accept()
"""
        mj_attrs_00 = {'event': 'modifyjob', 'order': '1', 'enabled': 'True'}
        mj_attrs_01 = {'event': 'modifyjob', 'order': '2', 'enabled': 'True'}
        rj_hook = """
import pbs
e1 = pbs.event()
e1.job.project = 'abc'
e2 = pbs.event()
e2.reject('bar')
"""
        rj_attrs = {'event': 'runjob', 'enabled': 'True'}
        self.server.create_import_hook('mj01', mj_attrs_01, mj_hook_01)
        # create out of order.
        self.server.create_import_hook('mj00', mj_attrs_00, mj_hook_00)
        self.server.create_import_hook('rj', rj_attrs, rj_hook)
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        j1 = Job(TEST_USER, {'Resource_List.walltime': 42})
        jid1 = self.server.submit(j1)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';a;' + jid1 + ';')
        self.assertIn('Priority=150', line)
        # The order-2 hook runs last, so its values win.
        self.assertIn('comment=foo2', line)
        self.assertIn('project=bbb', line)
        try:
            self.server.runjob(jid1)
        except PbsRunError:
            # runjob hook is rejecting the run request
            pass
        self.server.accounting_match(f';a;{jid1};project=abc')

    def test_queue_record_multiple_hook_00(self):
        """
        Test that changes made in a queuejob hooks are reflected in
        the Q record
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'scheduling': 'False',
                             'job_history_enable': 'True',
                             })
        qj_hook_00 = """
import pbs
e1 = pbs.event()
e1.job.project = 'foo00'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOK:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" Resource_List:{e1.job.Resource_List}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        qj_hook_01 = """
import pbs
e1 = pbs.event()
e1.job.project = str(e1.job.project) + '_foo01'
e1.accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        self.server.create_import_hook('qj00', qj_attrs, qj_hook_00)
        # FIXME set hook attr to priority order
        self.server.create_import_hook('qj01', qj_attrs, qj_hook_01)
        j = Job(TEST_USER, {'Resource_List.walltime': 42})
        j.set_sleep_time(1)
        jid1 = self.server.submit(j)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';Q;' + jid1)
        self.assertIn('project=foo00_foo01', line)
        (_, line) = self.server.accounting_match(';a;' + jid1)
        self.assertIn('Priority=150', line)
        self.server.runjob(jid1)
        self.server.expect(JOB, {'job_state': 'F'}, extend='x', id=jid1)
        (_, line) = self.server.accounting_match(';E;' + jid1)
        self.assertIn('project=foo00_foo01', line)

    def test_queue_record_multiple_hook_01(self):
        """
        Test that changes made in a modifyjob hook are reflected in
        the E record
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'scheduling': 'False',
                             'job_history_enable': 'True',
                             })
        mj_hook_00 = """
import pbs
e1 = pbs.event()
e1.job.project = 'foo02'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKQ0:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        mj_hook_01 = """
import pbs
e1 = pbs.event()
e1.job.project = str(e1.job.project) + '_foo03'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKQ0:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        mj_attrs_00 = {'event': 'modifyjob', 'order': 1, 'enabled': 'True'}
        mj_attrs_01 = {'event': 'modifyjob', 'order': 2, 'enabled': 'True'}
        self.server.create_import_hook('mj_00', mj_attrs_00, mj_hook_00)
        self.server.create_import_hook('mj_01', mj_attrs_01, mj_hook_01)
        j = Job(TEST_USER, {'Resource_List.walltime': 42})
        j.set_sleep_time(1)
        jid1 = self.server.submit(j)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';a;' + jid1)
        self.assertIn('Priority=150', line)
        self.assertIn('project=foo02_foo03', line)
        self.server.runjob(jid1)
        self.server.expect(JOB, {'job_state': 'F'}, extend='x', id=jid1)
        (_, line) = self.server.accounting_match(';E;' + jid1)
        self.assertIn('project=foo02_foo03', line)

    def test_queue_record_multiple_hook_02(self):
        """
        Test that changes made in a queuejob then modifyjob are stacking
        using job_o in the modifyjob hook.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'scheduling': 'False',
                             'job_history_enable': 'True',
                             })
        qj_hook_00 = """
import pbs
e1 = pbs.event()
e1.job.project = 'foo00'
e1 = pbs.event()
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKQ0:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" Resource_List:{e1.job.Resource_List}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        self.server.create_import_hook('qj00', qj_attrs, qj_hook_00)
        mj_hook_00 = """
import pbs
e1 = pbs.event()
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKM0a:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" job_o.id:{e1.job_o.id}"
           f" job_o.project:{e1.job_o.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.job.project = str(e1.job_o.project) + '_foo01'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKM0b:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" job_o.id:{e1.job_o.id}"
           f" job_o.project:{e1.job_o.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        mj_attrs = {'event': 'modifyjob', 'enabled': 'True'}
        # FIXME: there is a problem here when you enable the modifyjob hook.
        # the modifyjob hook doesn't get the change from the queuejob.
        self.server.create_import_hook('mj_00', mj_attrs, mj_hook_00)
        j = Job(TEST_USER, {'Resource_List.walltime': 1})
        j.set_sleep_time(1)
        jid1 = self.server.submit(j)
        self.server.alterjob(jid1, {ATTR_p: 150})
        self.server.runjob(jid1)
        self.server.expect(JOB, {'job_state': 'F'}, extend='x', id=jid1)
        (_, line) = self.server.accounting_match(';Q;' + jid1)
        self.assertIn('project=foo00', line)
        (_, line) = self.server.accounting_match(';a;' + jid1)
        self.assertIn('Priority=150', line)
        self.assertIn('project=foo00_foo01', line)
        (_, line) = self.server.accounting_match(';E;' + jid1)
        self.assertIn('project=foo00_foo01', line)

    def test_queue_record_multiple_hook_03(self):
        """
        Test that changes made in a queuejob then modifyjob are stacking
        using job_o in the first modifyjob hook, but not in the second.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'scheduling': 'False',
                             'job_history_enable': 'True',
                             })
        qj_hook_00 = """
import pbs
e1 = pbs.event()
e1.job.project = 'foo00'
e1.accept()
"""
        qj_hook_01 = """
import pbs
e1 = pbs.event()
e1.job.project = str(e1.job.project) + '_foo01'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKQ1:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" Resource_List:{e1.job.Resource_List}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        qj_attrs = {'event': 'queuejob', 'enabled': 'True'}
        self.server.create_import_hook('qj00', qj_attrs, qj_hook_00)
        self.server.create_import_hook('qj01', qj_attrs, qj_hook_01)
        mj_hook_00 = """
import pbs
e1 = pbs.event()
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKM0a:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" job_o.id:{e1.job_o.id}"
           f" job_o.project:{e1.job_o.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.job.project = str(e1.job_o.project) + '_foo02'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKM0b:e1:{hex(id(e1))}"
           f" jobid:{e1.job.id}"
           f" project:{e1.job.project}"
           f" job_o.id:{e1.job_o.id}"
           f" job_o.project:{e1.job_o.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        mj_hook_01 = """
import pbs
e1 = pbs.event()
e1.job.project = str(e1.job.project) + '_foo03'
pbs.logmsg(pbs.LOG_ERROR,
           f"HOOKM1:e1:{hex(id(e1))}"
           f" job.id:{e1.job.id}"
           f" job.project:{e1.job.project}"
           f" job_o.id:{e1.job_o.id}"
           f" job_o.project:{e1.job_o.project}"
           f" hex(id(job)):{hex(id(e1.job))}")
e1.accept()
"""
        mj_attrs_00 = {'event': 'modifyjob', 'order': 1, 'enabled': 'True'}
        mj_attrs_01 = {'event': 'modifyjob', 'order': 2, 'enabled': 'True'}
        self.server.create_import_hook('mj_00', mj_attrs_00, mj_hook_00)
        self.server.create_import_hook('mj_01', mj_attrs_01, mj_hook_01)
        j = Job(TEST_USER, {'Resource_List.walltime': 1})
        j.set_sleep_time(1)
        jid1 = self.server.submit(j)
        self.server.alterjob(jid1, {ATTR_p: 150})
        (_, line) = self.server.accounting_match(';Q;' + jid1)
        self.assertIn('project=foo00_foo01', line)
        self.server.runjob(jid1)
        self.server.expect(JOB, {'job_state': 'F'}, extend='x', id=jid1)
        (_, line) = self.server.accounting_match(';a;' + jid1)
        self.assertIn('Priority=150', line)
        self.assertIn('project=foo00_foo01_foo02_foo03', line)
        (_, line) = self.server.accounting_match(';E;' + jid1)
        self.assertIn('project=foo00_foo01_foo02_foo03', line)


================================================
FILE: test/tests/functional/pbs_accumulate_resc_used.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * import ast @requirements(num_moms=3) class TestPbsAccumulateRescUsed(TestFunctional): """ This tests the feature in PBS that enables mom hooks to accumulate resources_used values for resources beside cput, cpupercent, and mem. This includes accumulation of custom resources. The mom hooks supported this feature are: exechost_periodic, execjob_prologue, and execjob_epilogue. PRE: Have a cluster of PBS with 3 mom hosts, with an exechost_startup that adds custom resources. POST: When a job ends, accounting_logs reflect the aggregated resources_used values. And with job_history_enable=true, one can do a 'qstat -x -f ' to obtain information of a previous job. 
""" # Class variables def setUp(self): TestFunctional.setUp(self) self.logger.info("len moms = %d" % (len(self.moms))) if len(self.moms) != 3: usage_string = 'test requires 3 MoMs as input, ' + \ 'use -p moms=::' self.skip_test(usage_string) # PBSTestSuite returns the moms passed in as parameters as dictionary # of hostname and MoM object self.momA = self.moms.values()[0] self.momB = self.moms.values()[1] self.momC = self.moms.values()[2] self.momA.delete_vnode_defs() self.momB.delete_vnode_defs() self.momC.delete_vnode_defs() self.hostA = self.momA.shortname self.hostB = self.momB.shortname self.hostC = self.momC.shortname rc = self.server.manager(MGR_CMD_DELETE, NODE, None, "") self.assertEqual(rc, 0) rc = self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA) self.assertEqual(rc, 0) rc = self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostB) self.assertEqual(rc, 0) rc = self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostC) self.assertEqual(rc, 0) # Give the moms a chance to contact the server. self.server.expect(NODE, {'state': 'free'}, id=self.hostA) self.server.expect(NODE, {'state': 'free'}, id=self.hostB) self.server.expect(NODE, {'state': 'free'}, id=self.hostC) # First set some custom resources via exechost_startup hook. 
startup_hook_body = """ import pbs e=pbs.event() localnode=pbs.get_local_nodename() e.vnode_list[localnode].resources_available['foo_i'] = 7 e.vnode_list[localnode].resources_available['foo_f'] = 5.0 e.vnode_list[localnode].resources_available['foo_str'] = "seventyseven" """ hook_name = "start" a = {'event': "exechost_startup", 'enabled': 'True'} rv = self.server.create_import_hook( hook_name, a, startup_hook_body, overwrite=True) self.assertTrue(rv) self.momA.signal("-HUP") self.momB.signal("-HUP") self.momC.signal("-HUP") a = {'job_history_enable': 'True'} self.server.manager(MGR_CMD_SET, SERVER, a) # Next set some custom resources via qmgr -c 'create resource' attr = {} attr['type'] = 'string' attr['flag'] = 'h' r = 'foo_str2' rc = self.server.manager( MGR_CMD_CREATE, RSC, attr, id=r, runas=ROOT_USER, logerr=False) self.assertEqual(rc, 0) # Ensure the new resource is seen by all moms. momlist = [self.momA, self.momB, self.momC] for m in momlist: m.log_match("resourcedef;copy hook-related file") attr['type'] = 'string' attr['flag'] = 'h' r = 'foo_str3' rc = self.server.manager( MGR_CMD_CREATE, RSC, attr, id=r, runas=ROOT_USER, logerr=False) self.assertEqual(rc, 0) # Ensure the new resource is seen by all moms. for m in momlist: m.log_match("resourcedef;copy hook-related file") attr['type'] = 'string' attr['flag'] = 'h' r = 'foo_str4' rc = self.server.manager( MGR_CMD_CREATE, RSC, attr, id=r, runas=ROOT_USER, logerr=False) self.assertEqual(rc, 0) # Ensure the new resource is seen by all moms. for m in momlist: m.log_match("resourcedef;copy hook-related file") attr['type'] = 'string_array' attr['flag'] = 'h' r = 'stra' rc = self.server.manager( MGR_CMD_CREATE, RSC, attr, id=r, runas=ROOT_USER, logerr=False) self.assertEqual(rc, 0) # Give the moms a chance to receive the updated resource. # Ensure the new resource is seen by all moms. 
for m in momlist: m.log_match("resourcedef;copy hook-related file") def test_epilogue(self): """ Test accumulatinon of resources of a multinode job from an exechost_epilogue hook. """ self.logger.info("test_epilogue") hook_body = """ import pbs e=pbs.event() pbs.logmsg(pbs.LOG_DEBUG, "executed epilogue hook") if e.job.in_ms_mom(): e.job.resources_used["vmem"] = pbs.size("9gb") e.job.resources_used["foo_i"] = 9 e.job.resources_used["foo_f"] = 0.09 e.job.resources_used["foo_str"] = '{"seven":7}' e.job.resources_used["cput"] = 10 e.job.resources_used["stra"] = '"glad,elated","happy"' e.job.resources_used["foo_str3"] = \ \"\"\"{"a":6,"b":"some value #$%^&*@","c":54.4,"d":"32.5gb"}\"\"\" e.job.resources_used["foo_str2"] = "seven" e.job.resources_used["foo_str4"] = "eight" else: e.job.resources_used["vmem"] = pbs.size("10gb") e.job.resources_used["foo_i"] = 10 e.job.resources_used["foo_f"] = 0.10 e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}' e.job.resources_used["foo_str2"] = '{"seven":7}' e.job.resources_used["cput"] = 20 e.job.resources_used["stra"] = '"cucumbers,bananas"' e.job.resources_used["foo_str3"] = \"\"\""vn1":4,"vn2":5,"vn3":6\"\"\" """ hook_name = "epi" a = {'event': "execjob_epilogue", 'enabled': 'True', 'order': 999} rv = self.server.create_import_hook( hook_name, a, hook_body, overwrite=True) self.assertTrue(rv) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.walltime': 10, 'Resource_List.place': "scatter"} j = Job(TEST_USER) j.set_attributes(a) j.set_sleep_time("10") jid = self.server.submit(j) # The results should show results for custom resources 'foo_i', # 'foo_f', 'foo_str', 'foo_str3', and bultin resources 'vmem', # 'cput', and should be accumulating based # on the hook script, where MS defines 1 value, while the 2 sister # Moms define the same value. For 'string' type, it will be a # union of all values obtained from sister moms and local mom, and # the result will be in JSON-format. # # foo_str is for testing normal values. 
# foo_str2 is for testing non-JSON format value received from MS. # foo_str3 is for testing non-JSON format value received from a sister # mom. # foo_str4 is for testing MS-only set values. # # For string_array type resource 'stra', it is not accumulated but # will be set to last seen value from a mom epilogue hook. self.server.expect(JOB, { 'job_state': 'F', 'resources_used.foo_f': '0.29', 'resources_used.foo_i': '29', 'resources_used.foo_str4': "eight", 'resources_used.stra': "\"glad,elated\",\"happy\"", 'resources_used.vmem': '29gb', 'resources_used.cput': '00:00:50', 'resources_used.ncpus': '3'}, extend='x', offset=10, attrop=PTL_AND, id=jid) foo_str_dict_in = {"eight": 8, "seven": 7, "nine": 9} qstat = self.server.status( JOB, 'resources_used.foo_str', id=jid, extend='x') foo_str_dict_out_str = eval(qstat[0]['resources_used.foo_str']) foo_str_dict_out = eval(foo_str_dict_out_str) self.assertTrue(foo_str_dict_in == foo_str_dict_out) # resources_used.foo_str3 must not be set since a sister value is not # of JSON-format. self.server.expect(JOB, 'resources_used.foo_str3', op=UNSET, extend='x', id=jid) self.momA.log_match( "Job %s resources_used.foo_str3 cannot be " % (jid,) + "accumulated: value '\"vn1\":4,\"vn2\":5,\"vn3\":6' " + "from mom %s not JSON-format" % (self.hostB,)) # resources_used.foo_str2 must not be set. 
    def test_prologue(self):
        """
        Test accumulation of resources of a multinode job from an
        exechost_prologue hook.
        On cpuset systems don't check for cput because the pbs_cgroups
        hook will be enabled and will overwrite the cput value set in the
        prologue hook.
        """
        # Detect whether any mom manages a cpuset; if so, skip cput checks.
        has_cpuset = False
        for mom in self.moms.values():
            if mom.is_cpuset_mom():
                has_cpuset = True
        self.logger.info("test_prologue")
        # Hook: mother superior (MS) reports one set of values, every
        # sister mom reports another; the server accumulates them.
        hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "executed prologue hook")
if e.job.in_ms_mom():
    e.job.resources_used["vmem"] = pbs.size("11gb")
    e.job.resources_used["foo_i"] = 11
    e.job.resources_used["foo_f"] = 0.11
    e.job.resources_used["foo_str"] = '{"seven":7}'
    e.job.resources_used["cput"] = 11
    e.job.resources_used["stra"] = '"glad,elated","happy"'
    e.job.resources_used["foo_str3"] = \
\"\"\"{"a":6,"b":"some value #$%^&*@","c":54.4,"d":"32.5gb"}\"\"\"
    e.job.resources_used["foo_str2"] = "seven"
    e.job.resources_used["foo_str4"] = "eight"
else:
    e.job.resources_used["vmem"] = pbs.size("12gb")
    e.job.resources_used["foo_i"] = 12
    e.job.resources_used["foo_f"] = 0.12
    e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}'
    e.job.resources_used["foo_str2"] = '{"seven":7}'
    e.job.resources_used["cput"] = 12
    e.job.resources_used["stra"] = '"cucumbers,bananas"'
    e.job.resources_used["foo_str3"] = \"\"\""vn1":4,"vn2":5,"vn3":6\"\"\"
"""
        hook_name = "prolo"
        a = {'event': "execjob_prologue", 'enabled': 'True'}
        rv = self.server.create_import_hook(
            hook_name, a, hook_body, overwrite=True)
        self.assertTrue(rv)

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 10,
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)

        # The pbsdsh call is what allows a first task to get spawned on
        # on a sister mom, causing the execjob_prologue hook to execute.
        j.create_script(
            "pbsdsh -n 1 hostname\n" +
            "pbsdsh -n 2 hostname\n" +
            "sleep 10\n")
        jid = self.server.submit(j)

        # The results should show results for custom resources 'foo_i',
        # 'foo_f', 'foo_str', 'foo_str3', and builtin resources 'vmem',
        # 'cput', and should be accumulating based
        # on the hook script, where MS defines 1 value, while the 2 sister
        # Moms define the same value. For 'string' type, it will be a
        # union of all values obtained from sister moms and local mom, and
        # the result will be in JSON-format.
        #
        # foo_str is for testing normal values.
        # foo_str2 is for testing non-JSON format value received from MS.
        # foo_str3 is for testing non-JSON format value received from a sister
        # mom.
        # foo_str4 is for testing MS-only set values.
        #
        # For string_array type resource 'stra', it is not accumulated but
        # will be set to last seen value from a mom prologue hook.
        a = {
            'job_state': 'F',
            'resources_used.foo_f': '0.35',
            'resources_used.foo_i': '35',
            'resources_used.foo_str4': "eight",
            'resources_used.stra': "\"glad,elated\",\"happy\"",
            'resources_used.vmem': '35gb',
            'resources_used.ncpus': '3'}
        if not has_cpuset:
            a['resources_used.cput'] = '00:00:35'
        self.server.expect(JOB, a, extend='x', offset=10, attrop=PTL_AND,
                           id=jid)

        # The accumulated string value comes back as a quoted string;
        # unwrap it twice into a dict for comparison.
        foo_str_dict_in = {"eight": 8, "seven": 7, "nine": 9}
        qstat = self.server.status(
            JOB, 'resources_used.foo_str', id=jid, extend='x')
        foo_str_dict_out_str = eval(qstat[0]['resources_used.foo_str'])
        foo_str_dict_out = eval(foo_str_dict_out_str)
        self.assertTrue(foo_str_dict_in == foo_str_dict_out)

        # resources_used.foo_str3 must not be set since a sister value is
        # not of JSON-format.
        self.server.expect(JOB, 'resources_used.foo_str3', op=UNSET,
                           extend='x', id=jid)
        self.momA.log_match(
            "Job %s resources_used.foo_str3 cannot be " % (jid,) +
            "accumulated: value '\"vn1\":4,\"vn2\":5,\"vn3\":6' " +
            "from mom %s not JSON-format" % (self.hostB,))
        self.momA.log_match(
            "Job %s resources_used.foo_str3 cannot be " % (jid,) +
            "accumulated: value '\"vn1\":4,\"vn2\":5,\"vn3\":6' " +
            "from mom %s not JSON-format" % (self.hostC,))

        # Ensure resources_used.foo_str3 is not set since it has a
        # non-JSON format value.
        self.server.expect(JOB, 'resources_used.foo_str3', op=UNSET,
                           extend='x', id=jid)

        # resources_used.foo_str2 must not be set.
        self.server.expect(JOB, 'resources_used.foo_str2', op=UNSET, id=jid)
        self.momA.log_match(
            "Job %s resources_used.foo_str2 cannot be " % (jid,) +
            "accumulated: value 'seven' from " +
            "mom %s not JSON-format" % (self.hostA,))

        # Match accounting_logs entry
        acctlog_match = 'resources_used.foo_f=0.35'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        acctlog_match = 'resources_used.foo_i=35'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        acctlog_match = "resources_used.foo_str='%s'" % (foo_str_dict_out_str,)
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        acctlog_match = 'resources_used.vmem=35gb'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        if not has_cpuset:
            acctlog_match = 'resources_used.cput=00:00:35'
            self.server.accounting_match(
                "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        # resources_used.foo_str2 should not be reported in accounting_logs.
        acctlog_match = 'resources_used.foo_str2='
        self.server.accounting_match("E;%s;.*%s.*" % (jid, acctlog_match),
                                     regexp=True, n=100, existence=False)
        acctlog_match = 'resources_used.ncpus=3'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        # resources_used.foo_str3 must not show up in accounting_logs
        acctlog_match = 'resources_used.foo_str3='
        self.server.accounting_match("E;%s;.*%s.*" % (jid, acctlog_match),
                                     regexp=True, n=100, existence=False)
        acctlog_match = 'resources_used.foo_str4=eight'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
        acctlog_match = r'resources_used.stra=\"glad\,elated\"\,\"happy\"'
        self.server.accounting_match(
            "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100)
acctlog_match = 'resources_used.foo_str2=' self.server.accounting_match("E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100, existence=False) acctlog_match = 'resources_used.ncpus=3' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) # resources_used.foo_str3 must not show up in accounting_logs acctlog_match = 'resources_used.foo_str3=' self.server.accounting_match("E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100, existence=False) acctlog_match = 'resources_used.foo_str4=eight' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = r'resources_used.stra=\"glad\,elated\"\,\"happy\"' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) def test_periodic(self): """ Test accumulatinon of resources from an exechost_periodic hook. """ self.logger.info("test_periodic") hook_body = """ import pbs e=pbs.event() pbs.logmsg(pbs.LOG_DEBUG, "executed periodic hook") i = 0 l = [] for v in pbs.server().vnodes(): pbs.logmsg(pbs.LOG_DEBUG, "node %s" % (v.name,)) l.append(v.name) local_node=pbs.get_local_nodename() for jk in e.job_list.keys(): if local_node == l[0]: e.job_list[jk].resources_used["vmem"] = pbs.size("11gb") e.job_list[jk].resources_used["foo_i"] = 11 e.job_list[jk].resources_used["foo_f"] = 0.11 e.job_list[jk].resources_used["foo_str"] = '{"seven":7}' e.job_list[jk].resources_used["cput"] = 11 e.job_list[jk].resources_used["stra"] = '"glad,elated","happy"' e.job_list[jk].resources_used["foo_str3"] = \ \"\"\"{"a":6,"b":"some value #$%^&*@","c":54.4,"d":"32.5gb"}\"\"\" e.job_list[jk].resources_used["foo_str2"] = "seven" elif local_node == l[1]: e.job_list[jk].resources_used["vmem"] = pbs.size("12gb") e.job_list[jk].resources_used["foo_i"] = 12 e.job_list[jk].resources_used["foo_f"] = 0.12 e.job_list[jk].resources_used["foo_str"] = '{"eight":8}' e.job_list[jk].resources_used["cput"] = 12 e.job_list[jk].resources_used["stra"] = 
'"cucumbers,bananas"' e.job_list[jk].resources_used["foo_str2"] = '{"seven":7}' e.job_list[jk].resources_used["foo_str3"] = \ \"\"\"{"vn1":4,"vn2":5,"vn3":6}\"\"\" else: e.job_list[jk].resources_used["vmem"] = pbs.size("13gb") e.job_list[jk].resources_used["foo_i"] = 13 e.job_list[jk].resources_used["foo_f"] = 0.13 e.job_list[jk].resources_used["foo_str"] = '{"nine":9}' e.job_list[jk].resources_used["foo_str2"] = '{"seven":7}' e.job_list[jk].resources_used["cput"] = 13 e.job_list[jk].resources_used["stra"] = '"cucumbers,bananas"' e.job_list[jk].resources_used["foo_str3"] = \ \"\"\"{"vn1":4,"vn2":5,"vn3":6}\"\"\" """ hook_name = "period" a = {'event': "exechost_periodic", 'enabled': 'True', 'freq': 15} rv = self.server.create_import_hook( hook_name, a, hook_body, overwrite=True) self.assertTrue(rv) a = {'resources_available.ncpus': '2'} self.server.manager(MGR_CMD_SET, NODE, a, self.hostA) self.server.manager(MGR_CMD_SET, NODE, a, self.hostB) self.server.manager(MGR_CMD_SET, NODE, a, self.hostC) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.place': 'scatter'} j = Job(TEST_USER) j.set_attributes(a) j.set_sleep_time("35") jid1 = self.server.submit(j) jid2 = self.server.submit(j) for jid in [jid1, jid2]: # The results should show results for custom resources 'foo_i', # 'foo_f', 'foo_str', 'foo_str3', and bultin resources 'vmem', # 'cput', and should be accumulating based # on the hook script, where MS defines 1 value, while the 2 sister # Moms define the same value. For 'string' type, it will be a # union of all values obtained from sister moms and local mom, and # the result will be in JSON-format. # foo_str is for testing normal values. # foo_str2 is for testing non-JSON format value received from MS. # foo_str3 is for testing non-JSON format value received from a # sister mom. 
# self.server.expect(JOB, { 'job_state': 'F', 'resources_used.foo_f': '0.36', 'resources_used.foo_i': '36', 'resources_used.stra': "\"glad,elated\",\"happy\"", 'resources_used.vmem': '36gb', 'resources_used.cput': '00:00:36', 'resources_used.ncpus': '3'}, extend='x', offset=35, attrop=PTL_AND, id=jid) foo_str_dict_in = {"eight": 8, "seven": 7, "nine": 9} qstat = self.server.status( JOB, 'resources_used.foo_str', id=jid, extend='x') foo_str_dict_out_str = eval(qstat[0]['resources_used.foo_str']) foo_str_dict_out = eval(foo_str_dict_out_str) self.assertTrue(foo_str_dict_in == foo_str_dict_out) foo_str3_dict_in = {"a": 6, "b": "some value #$%^&*@", "c": 54.4, "d": "32.5gb", "vn1": 4, "vn2": 5, "vn3": 6} qstat = self.server.status( JOB, 'resources_used.foo_str3', id=jid, extend='x') foo_str3_dict_out_str = eval(qstat[0]['resources_used.foo_str3']) foo_str3_dict_out = eval(foo_str3_dict_out_str) self.assertTrue(foo_str3_dict_in == foo_str3_dict_out) # resources_used.foo_str2 must be unset since its value is not of # JSON-format. 
self.server.expect(JOB, 'resources_used.foo_str2', op=UNSET, extend='x', id=jid) # Match accounting_logs entry acctlog_match = 'resources_used.foo_f=0.36' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = 'resources_used.foo_i=36' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = "resources_used.foo_str='%s'" % ( foo_str_dict_out_str,) self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = 'resources_used.vmem=36gb' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = 'resources_used.cput=00:00:36' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) # resources_used.foo_str2 must not show in accounting_logs acctlog_match = 'resources_used.foo_str2=', self.server.accounting_match("E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100, existence=False) acctlog_match = 'resources_used.ncpus=3' self.server.accounting_match( "E;%s;.*%s.*" % (jid, acctlog_match), regexp=True, n=100) acctlog_match = "resources_used.foo_str3='%s'" % ( foo_str3_dict_out_str.replace('.', r'\.'). 
    def test_resource_bool(self):
        """
        To test that boolean values are not getting aggregated.
        """
        # Create a boolean type resource
        attr = {}
        attr['type'] = 'boolean'
        self.server.manager(
            MGR_CMD_CREATE, RSC, attr, id='foo_bool', runas=ROOT_USER,
            logerr=False)

        # MS reports True while sisters report False; the final value must
        # be the MS value, not an aggregate.
        hook_body = """
import pbs
e=pbs.event()
j=e.job
if j.in_ms_mom():
    j.resources_used["foo_bool"] = True
else:
    j.resources_used["foo_bool"] = False
"""
        hook_name = "epi_bool"
        a = {'event': "execjob_epilogue", 'enabled': "True"}
        self.server.create_import_hook(
            hook_name, a, hook_body, overwrite=True)

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 10,
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        j.set_sleep_time("5")
        jid = self.server.submit(j)

        # foo_bool is True
        a = {'resources_used.foo_bool': "True", 'job_state': 'F'}
        self.server.expect(JOB, a, extend='x', offset=5, attrop=PTL_AND,
                           id=jid)

    def test_resource_invisible(self):
        """
        Test that value aggregation is same for invisible resources.
        """
        # Set float and string_array to be invisible resources
        attr = {}
        attr['flag'] = 'ih'
        self.server.manager(
            MGR_CMD_SET, RSC, attr, id='foo_f', runas=ROOT_USER)
        self.server.manager(
            MGR_CMD_SET, RSC, attr, id='foo_str', runas=ROOT_USER)

        hook_body = """
import pbs
e=pbs.event()
j = e.job
if j.in_ms_mom():
    j.resources_used["foo_f"] = 2.114
    j.resources_used["foo_str"] = '{"one":1,"two":2}'
else:
    j.resources_used["foo_f"] = 3.246
    j.resources_used["foo_str"] = '{"two":2, "three":3}'
"""
        hook_name = "epi_invis"
        a = {'event': "execjob_epilogue", 'enabled': 'True'}
        self.server.create_import_hook(
            hook_name, a, hook_body, overwrite=True)

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 10,
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        j.set_sleep_time("5")
        jid = self.server.submit(j)

        # Verify that values are accumulated for float and string array:
        # 2.114 (MS) + 2 * 3.246 (sisters) = 8.606
        a = {'resources_used.foo_f': '8.606'}
        self.server.expect(JOB, a, extend='x', offset=5, id=jid)
        # The string value accumulates into the union of the dicts.
        foo_str_dict_in = {"one": 1, "two": 2, "three": 3}
        qstat = self.server.status(
            JOB, 'resources_used.foo_str', id=jid, extend='x')
        foo_str_dict_out_str = eval(qstat[0]['resources_used.foo_str'])
        foo_str_dict_out = eval(foo_str_dict_out_str)
        self.assertEqual(foo_str_dict_in, foo_str_dict_out)
    def test_reservation(self):
        """
        Test that a job inside a reservation works the same.
        NOTE: Due to the reservation duration and the job duration both
        being equal, this test found 2 race conditions. KEEP the durations
        equal to each other.
        """
        # Create non-host level resources from qmgr
        attr = {}
        attr['type'] = 'size'
        self.server.manager(
            MGR_CMD_CREATE, RSC, attr, id='foo_i2', runas=ROOT_USER)

        # Ensure the new resource is seen by all moms.
        momlist = [self.momA, self.momB, self.momC]
        for m in momlist:
            m.log_match("resourcedef;copy hook-related file")

        attr['type'] = 'float'
        self.server.manager(
            MGR_CMD_CREATE, RSC, attr, id='foo_f2', runas=ROOT_USER)

        # Ensure the new resource is seen by all moms.
        for m in momlist:
            m.log_match("resourcedef;copy hook-related file")

        attr['type'] = 'string_array'
        self.server.manager(
            MGR_CMD_CREATE, RSC, attr, id='stra2', runas=ROOT_USER)

        # Ensure the new resource is seen by all moms.
        for m in momlist:
            m.log_match("resourcedef;copy hook-related file")

        # Create an epilogue hook: every mom reports the same values,
        # which the server accumulates across the 3 vnodes.
        hook_body = """
import pbs
e = pbs.event()
j = e.job
pbs.logmsg(pbs.LOG_DEBUG, "executed epilogue hook")
j.resources_used["foo_i"] = 2
j.resources_used["foo_i2"] = pbs.size(1000)
j.resources_used["foo_f"] = 1.02
j.resources_used["foo_f2"] = 2.01
j.resources_used["stra"] = '"happy"'
j.resources_used["stra2"] = '"glad"'
"""
        # Create and import hook
        a = {'event': "execjob_epilogue", 'enabled': 'True'}
        self.server.create_import_hook(
            "epi", a, hook_body, overwrite=True)

        # Submit a reservation
        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.place': 'scatter',
             'reserve_start': time.time() + 10,
             'reserve_end': time.time() + 30, }
        r = Reservation(TEST_USER, a)
        rid = self.server.submit(r)
        a = {'reserve_state': (MATCH_RE, "RESV_CONFIRMED|2")}
        self.server.expect(RESV, a, id=rid)
        rname = rid.split('.')

        # Submit a job inside reservation
        a = {'Resource_List.select': '3:ncpus=1', ATTR_queue: rname[0]}
        j = Job(TEST_USER)
        j.set_attributes(a)
        j.set_sleep_time(20)
        jid = self.server.submit(j)

        # Verify the resource values (each value accumulated 3x)
        a = {'resources_used.foo_i': '6',
             'resources_used.foo_i2': '3kb',
             'resources_used.foo_f': '3.06',
             'resources_used.foo_f2': '6.03',
             'resources_used.stra': "\"happy\"",
             'resources_used.stra2': "\"glad\"",
             'job_state': 'F'}
        self.server.expect(JOB, a, extend='x', attrop=PTL_AND, offset=30,
                           interval=1, id=jid)

        # Below is commented out due to a problem with history jobs
        # disappearing after a server restart when the reservation is
        # in state BD during restart.
        # Once that bug is fixed, this test code should be uncommented
        # and run.
        # Restart server and verifies that the values are still the same
        # self.server.restart()
        # self.server.expect(JOB, a, extend='x', id=jid)
# Restart server and verifies that the values are still the same # self.server.restart() # self.server.expect(JOB, a, extend='x', id=jid) def test_server_restart(self): """ Test that resource accumulation will not get impacted if server is restarted during job execution On cpuset systems don't check for cput because the pbs_cgroups hook will be enabled and will overwrite the cput value set in the prologue hook """ has_cpuset = False for mom in self.moms.values(): if mom.is_cpuset_mom(): has_cpuset = True # Create a prologue hook hook_body = """ import pbs e=pbs.event() pbs.logmsg(pbs.LOG_DEBUG, "executed prologue hook") if e.job.in_ms_mom(): e.job.resources_used["vmem"] = pbs.size("11gb") e.job.resources_used["foo_i"] = 11 e.job.resources_used["foo_f"] = 0.11 e.job.resources_used["foo_str"] = '{"seven":7}' e.job.resources_used["cput"] = 11 e.job.resources_used["stra"] = '"glad,elated","happy"' e.job.resources_used["foo_str4"] = "eight" else: e.job.resources_used["vmem"] = pbs.size("12gb") e.job.resources_used["foo_i"] = 12 e.job.resources_used["foo_f"] = 0.12 e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}' e.job.resources_used["cput"] = 12 e.job.resources_used["stra"] = '"cucumbers,bananas"' """ hook_name = "prolo" a = {'event': "execjob_prologue", 'enabled': 'True'} self.server.create_import_hook( hook_name, a, hook_body, overwrite=True) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.walltime': 20, 'Resource_List.place': 'scatter'} j = Job(TEST_USER) j.set_attributes(a) # The pbsdsh call is what allows a first task to get spawned on # on a sister mom, causing the execjob_prologue hook to execute. j.create_script( "pbsdsh -n 1 hostname\n" + "pbsdsh -n 2 hostname\n" + "sleep 10\n") jid = self.server.submit(j) # Once the job is started running restart server self.server.expect(JOB, {'job_state': "R", "substate": 42}, id=jid) self.server.restart() # Job will be requeued and rerun. 
    def test_mom_down(self):
        """
        Test that resource accumulation is not impacted due to mom restart.
        """
        # Set node_fail_requeue to requeue job
        self.server.manager(MGR_CMD_SET, SERVER, {'node_fail_requeue': 10})

        hook_body = """
import pbs
e = pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "executed periodic hook")
for jj in e.job_list.keys():
    e.job_list[jj].resources_used["foo_i"] = 1
    e.job_list[jj].resources_used["foo_str"] = '{"happy":"true"}'
    e.job_list[jj].resources_used["stra"] = '"one","two"'
"""
        a = {'event': "exechost_periodic", 'enabled': 'True', 'freq': 10}
        self.server.create_import_hook(
            "period", a, hook_body, overwrite=True)

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 300,
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid1 = self.server.submit(j)

        # Submit a job that can never run
        a = {'Resource_List.select': '5:ncpus=1',
             'Resource_List.place': 'scatter'}
        j.set_attributes(a)
        j.set_sleep_time("300")
        jid2 = self.server.submit(j)

        # Wait for 10s approx for hook to get executed
        # verify the resources_used.foo_i
        self.server.expect(JOB, {'resources_used.foo_i': '3'}, offset=10,
                           id=jid1, interval=1)
        # The queued job must not accumulate anything.
        self.server.expect(JOB, "resources_used.foo_i", op=UNSET, id=jid2)

        # Bring sister mom down
        self.momB.stop()

        # Wait for 20 more seconds for periodic hook to run
        # more than once and verify that value is still 3
        self.server.expect(JOB, {'resources_used.foo_i': '3'}, offset=20,
                           id=jid1, interval=1)

        # Wait for job to be requeued by node_fail_requeue
        self.server.rerunjob(jid1, runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid1)

        # Verify that resources_used.foo_i is unset
        self.server.expect(JOB, "resources_used.foo_i", op=UNSET, id=jid1)

        # Bring sister mom up
        self.momB.start()
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'})
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1, interval=1)

        # Verify that value of foo_i for job1 is set back
        self.server.expect(JOB, {'resources_used.foo_i': '3'}, offset=10,
                           id=jid1, interval=1)
    def test_job_rerun(self):
        """
        Test that resource accumulates once when job is rerun.
        """
        hook_body = """
import pbs
e = pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "executed periodic hook")
for jj in e.job_list.keys():
    e.job_list[jj].resources_used["foo_f"] = 1.01
    e.job_list[jj].resources_used["cput"] = 10
"""
        a = {'event': "exechost_periodic", 'enabled': 'True', 'freq': 10}
        self.server.create_import_hook(
            "period", a, hook_body, overwrite=True)

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid1 = self.server.submit(j)
        self.server.expect(JOB, {'job_state': "R", "substate": 42}, id=jid1)

        # Wait for 10s approx for hook to get executed
        # Verify the resources_used.foo_f (3 moms x 1.01 / 10)
        a = {'resources_used.foo_f': '3.03',
             'resources_used.cput': 30}
        self.server.expect(JOB, a, offset=10, id=jid1, attrop=PTL_AND,
                           interval=1)

        # Rerun the job
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        self.server.rerunjob(jobid=jid1, runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid1)

        # Verify that foo_f is unset
        self.server.expect(JOB, 'Resource_List.foo_f', op=UNSET, id=jid1)

        # turn the scheduling on
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'})
        self.server.expect(JOB, {'job_state': "R", "substate": 42},
                           attrop=PTL_AND, id=jid1)

        # Validate that resources_used.foo_f is reset
        self.server.expect(JOB, a, offset=10, id=jid1, attrop=PTL_AND,
                           interval=1)
self.server.expect(JOB, {'job_state': "R", "substate": 42}, attrop=PTL_AND, id=jid1) # Validate that resources_used.foo_f is reset self.server.expect(JOB, a, offset=10, id=jid1, attrop=PTL_AND, interval=1) def test_job_array(self): """ Test that resource accumulation for subjobs also work """ hook_body = """ import pbs e=pbs.event() pbs.logmsg(pbs.LOG_DEBUG, "executed epilogue hook") if e.job.in_ms_mom(): e.job.resources_used["vmem"] = pbs.size("9gb") e.job.resources_used["foo_i"] = 9 e.job.resources_used["foo_f"] = 0.09 e.job.resources_used["foo_str"] = '{"seven":7}' e.job.resources_used["cput"] = 10 e.job.resources_used["stra"] = '"glad,elated","happy"' else: e.job.resources_used["vmem"] = pbs.size("10gb") e.job.resources_used["foo_i"] = 10 e.job.resources_used["foo_f"] = 0.10 e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}' e.job.resources_used["cput"] = 20 e.job.resources_used["stra"] = '"cucumbers,bananas"' """ a = {'event': "execjob_epilogue", 'enabled': 'True'} self.server.create_import_hook( "test", a, hook_body, overwrite=True) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.walltime': 10, 'Resource_List.place': 'scatter'} j = Job(TEST_USER, attrs={ATTR_J: '1-2'}) j.set_attributes(a) j.set_sleep_time("5") jid = self.server.submit(j) # Verify that once subjobs are over values are # set for each subjob in the accounting logs subjob1 = str.replace(jid, '[]', '[1]') acctlog_match = 'resources_used.foo_f=0.29' # Below code is commented due to a PTL issue # s = self.server.accounting_match( # "E;%s;.*%s.*" % (subjob1, acctlog_match), regexp=True, n=100) # self.assertTrue(s) acctlog_match = 'resources_used.foo_i=29' # s = self.server.accounting_match( # "E;%s;.*%s.*" % (subjob1, acctlog_match), regexp=True, n=100) # self.assertTrue(s) foo_str_dict_in = {"eight": 8, "seven": 7, "nine": 9} acctlog_match = "resources_used.foo_str='%s'" % (foo_str_dict_in,) # s = self.server.accounting_match( # "E;%s;.*%s.*" % (subjob1, acctlog_match), regexp=True, 
    def test_epi_pro(self):
        """
        Test that epilogue and prologue changing same and different
        resources. Values of the same resource would get overwritten by
        the last hook.
        On cpuset systems don't check for cput because the pbs_cgroups
        hook will be enabled and will overwrite the cput value set in the
        prologue hook.
        """
        # Detect whether any mom manages a cpuset; if so, skip cput checks.
        has_cpuset = False
        for mom in self.moms.values():
            if mom.is_cpuset_mom():
                has_cpuset = True

        hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "In prologue hook")
e.job.resources_used["foo_i"] = 10
e.job.resources_used["foo_f"] = 0.10
"""
        a = {'event': "execjob_prologue", 'enabled': 'True'}
        self.server.create_import_hook(
            "pro", a, hook_body, overwrite=True)

        # Verify the copy message in the logs to avoid
        # race conditions
        momlist = [self.momA, self.momB, self.momC]
        for m in momlist:
            m.log_match("pro.PY;copy hook-related file")

        hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "In epilogue hook")
e.job.resources_used["foo_f"] = 0.20
e.job.resources_used["cput"] = 10
"""
        a = {'event': "execjob_epilogue", 'enabled': 'True'}
        self.server.create_import_hook(
            "epi", a, hook_body, overwrite=True)

        # Verify the copy message in the logs to avoid
        # race conditions
        for m in momlist:
            m.log_match("epi.PY;copy hook-related file")

        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        j.create_script(
            "pbsdsh -n 1 hostname\n" +
            "pbsdsh -n 2 hostname\n" +
            "sleep 5\n")
        jid = self.server.submit(j)

        # Verify the resources_used once the job is over:
        # foo_f was reported by both hooks, the epilogue value wins.
        b = {
            'resources_used.foo_i': '30',
            'resources_used.foo_f': '0.6',
            'job_state': 'F'}
        if not has_cpuset:
            b['resources_used.cput'] = '30'
        self.server.expect(JOB, b, extend='x', id=jid, offset=5, interval=1)

        # Submit another job
        j1 = Job(TEST_USER)
        j1.set_attributes(a)
        j1.create_script(
            "pbsdsh -n 1 hostname\n" +
            "pbsdsh -n 2 hostname\n" +
            "sleep 300\n")
        jid1 = self.server.submit(j1)

        # Verify that prologue hook has set the values
        self.server.expect(JOB, {
            'job_state': 'R',
            'resources_used.foo_i': '30',
            'resources_used.foo_f': '0.3'},
            attrop=PTL_AND, id=jid1, interval=2)

        # Force delete the job
        self.server.deljob(id=jid1, wait=True, attr_W="force")

        # Verify values are accumulated by prologue hook only
        self.server.expect(JOB, {
            'resources_used.foo_i': '30',
            'resources_used.foo_f': '0.3'},
            attrop=PTL_AND, extend='x', id=jid1)
    def test_server_restart2(self):
        """
        Test that server restart during hook execution has no impact.
        """
        # The trailing sleep keeps the epilogue hook running while the
        # server is restarted below.
        hook_body = """
import pbs
import time
e = pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "executed epilogue hook")
if e.job.in_ms_mom():
    e.job.resources_used["vmem"] = pbs.size("9gb")
    e.job.resources_used["foo_i"] = 9
    e.job.resources_used["foo_f"] = 0.09
    e.job.resources_used["foo_str"] = '{"seven":7}'
    e.job.resources_used["cput"] = 10
else:
    e.job.resources_used["vmem"] = pbs.size("10gb")
    e.job.resources_used["foo_i"] = 10
    e.job.resources_used["foo_f"] = 0.10
    e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}'
    e.job.resources_used["cput"] = 20
time.sleep(15)
"""
        a = {'event': "execjob_epilogue", 'enabled': 'True'}
        self.server.create_import_hook(
            "epi", a, hook_body, overwrite=True)

        # Submit a job
        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 10,
             'Resource_List.place': "scatter",
             'Keep_Files': 'oe'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        j.set_sleep_time("5")
        jid = self.server.submit(j)

        # Verify the resource values
        a = {'resources_used.foo_i': 29,
             'resources_used.foo_f': 0.29}
        a_dict = {'eight': 8, 'seven': 7, 'nine': 9}
        self.server.expect(JOB, a, extend='x', attrop=PTL_AND, offset=5,
                           id=jid, interval=1)
        # check for dictionary resource
        job_status = self.server.status(JOB, id=jid, extend='x')
        job_str_resource = dict(job_status[0])['resources_used.foo_str']
        job_str_resource = ast.literal_eval(ast.literal_eval(job_str_resource))
        self.assertEqual(job_str_resource, a_dict)

        # Restart server while hook is still executing
        self.server.restart()

        # Verify that values again
        self.server.expect(JOB, a, extend='x', attrop=PTL_AND, id=jid)
        # check for dictionary resource
        job_status = self.server.status(JOB, id=jid, extend='x')
        job_str_resource = dict(job_status[0])['resources_used.foo_str']
        job_str_resource = ast.literal_eval(ast.literal_eval(job_str_resource))
        self.assertEqual(job_str_resource, a_dict)
    def test_mom_down2(self):
        """
        Test that when mom is down values are still accumulated for
        resources.
        """
        hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "executed epilogue hook")
if e.job.in_ms_mom():
    e.job.resources_used["vmem"] = pbs.size("9gb")
    e.job.resources_used["foo_i"] = 9
    e.job.resources_used["foo_f"] = 0.09
    e.job.resources_used["foo_str"] = '{"seven":7}'
    e.job.resources_used["cput"] = 10
    e.job.resources_used["stra"] = '"glad,elated","happy"'
else:
    e.job.resources_used["vmem"] = pbs.size("10gb")
    e.job.resources_used["foo_i"] = 10
    e.job.resources_used["foo_f"] = 0.10
    e.job.resources_used["foo_str"] = '{"eight":8,"nine":9}'
    e.job.resources_used["cput"] = 20
    e.job.resources_used["stra"] = '"cucumbers,bananas"'
"""
        a = {'event': "execjob_epilogue", 'enabled': 'True'}
        self.server.create_import_hook(
            "epi", a, hook_body, overwrite=True)

        # Submit a job
        a = {'Resource_List.select': '3:ncpus=1',
             'Resource_List.walltime': 40,
             'Resource_List.place': "scatter"}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid = self.server.submit(j)

        # Verify job is running
        self.server.expect(JOB, {'job_state': "R"}, id=jid)

        # Bring sister mom down
        self.momB.stop()

        # Wait for job to end
        # Validate that the values are being set
        # with 2 moms only (MS + one sister: 9 + 10, 0.09 + 0.10)
        self.server.expect(JOB, {'job_state': 'F',
                                 'resources_used.foo_i': '19',
                                 'resources_used.foo_f': '0.19'},
                           offset=10, id=jid, interval=1, extend='x',
                           attrop=PTL_AND)
        a_dict = {'eight': 8, 'nine': 9, 'seven': 7}
        # check for dictionary resource
        job_status = self.server.status(JOB, id=jid, extend='x')
        job_str_resource = dict(job_status[0])['resources_used.foo_str']
        job_str_resource = ast.literal_eval(ast.literal_eval(job_str_resource))
        self.assertEqual(job_str_resource, a_dict)

        # Bring the mom back up
        self.momB.start()
{'job_state': "R"}, id=jid) # Bring sister mom down self.momB.stop() # Wait for job to end # Validate that the values are being set # with 2 moms only self.server.expect(JOB, {'job_state': 'F', 'resources_used.foo_i': '19', 'resources_used.foo_f': '0.19'}, offset=10, id=jid, interval=1, extend='x', attrop=PTL_AND) a_dict = {'eight': 8, 'nine': 9, 'seven': 7} # check for dictionary resource job_status = self.server.status(JOB, id=jid, extend='x') job_str_resource = dict(job_status[0])['resources_used.foo_str'] job_str_resource = ast.literal_eval(ast.literal_eval(job_str_resource)) self.assertEqual(job_str_resource, a_dict) # Bring the mom back up self.momB.start() def test_finished_walltime(self): """ If used resources are modified from hook, this test makes sure that mem used resources are merged and once the job ends, the walltime is not zero. """ hook_body = """ import pbs e = pbs.event() if e.type == pbs.EXECHOST_PERIODIC: for jobid in e.job_list: e.job_list[jobid].resources_used["mem"] = pbs.size('1024kb') else: e.job.resources_used["mem"] = pbs.size('1024kb') """ hook_name = "multinode_used" attr = {'event': 'exechost_periodic,execjob_epilogue,execjob_end', 'freq': '3', 'enabled': 'True'} rv = self.server.create_import_hook(hook_name, attr, hook_body) self.assertTrue(rv) sleeptime = 30 a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.walltime': sleeptime, 'Resource_List.place': "scatter"} j = Job(TEST_USER) j.set_attributes(a) j.set_sleep_time(f"{sleeptime}") jid = self.server.submit(j) self.server.expect(JOB, { 'job_state': 'R', 'resources_used.mem': '3072kb'}, attrop=PTL_AND, offset=sleeptime/2, id=jid) self.server.expect(JOB, { 'job_state': 'F', 'resources_used.mem': '3072kb', 'resources_used.walltime': sleeptime}, op=GE, extend='x', offset=sleeptime/2, attrop=PTL_AND, id=jid) ================================================ FILE: test/tests/functional/pbs_acl_groups.py ================================================ # coding: utf-8 # Copyright (C) 
1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.
from tests.functional import * class Test_acl_groups(TestFunctional): """ Test to check acl_groups and acl_resv_groups considers secondary group """ def test_acl_grp_queue(self): """ Set acl_groups on a queue and submit a job with a user for whom the set group is a secondary group """ a = {'queue_type': 'execution', 'started': 't', 'enabled': 't', 'acl_group_enable': 't', 'acl_groups': TSTGRP1} self.server.manager(MGR_CMD_CREATE, QUEUE, a, id='workq2') a = {'queue': 'workq2'} j = Job(TEST_USER1, attrs=a) # If 'Unauthorized Request' is found in error message the test would # fail as user was not able to submit job as a secondary group member try: jid = self.server.submit(j) except PbsSubmitError as e: self.assertFalse('Unauthorized Request' in e.msg[0]) def test_acl_resv_groups(self): """ Set acl_resv_groups on server and submit a reservation from a user for whom the set group is a secondary group """ self.server.manager(MGR_CMD_SET, SERVER, { 'acl_resv_group_enable': 'true'}) self.server.manager(MGR_CMD_SET, SERVER, {'acl_resv_groups': TSTGRP1}) # If 'Requestor's group not authorized' is found in error message the # test would fail as user was not able to submit reservation # as a secondary group member try: r = Reservation(TEST_USER1) rstart = int(time.time()) + 10 rend = int(time.time()) + 360 a = {'reserve_start': rstart, 'reserve_end': rend} r.set_attributes(a) rid = self.server.submit(r) except PbsSubmitError as e: self.assertFalse( 'Requestor\'s group not authorized' in e.msg[0]) ================================================ FILE: test/tests/functional/pbs_acl_host_moms.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
from tests.functional import *


class Test_acl_host_moms(TestFunctional):
    """
    This test suite is for testing the server attribute
    acl_host_moms_enable and this test requires two moms.
    """

    def setUp(self):
        """
        Determine the remote host and set acl_host_enable = True
        """
        TestFunctional.setUp(self)
        usage_string = 'test requires a MoM and a client as input, ' + \
            ' use -p moms=<mom>,client=<client>'
        # PBSTestSuite returns the moms passed in as parameters as a
        # dictionary of hostname and MoM object
        self.momA = self.moms.values()[0]
        self.momA.delete_vnode_defs()
        self.hostA = self.momA.shortname
        if not self.du.is_localhost(self.server.client):
            # acl_hosts expects FQDN
            self.hostB = socket.getfqdn(self.server.client)
        else:
            self.skip_test(usage_string)
        self.remote_host = None
        if not self.du.is_localhost(self.hostA):
            self.remote_host = self.hostA
        else:
            self.skip_test(usage_string)
        self.assertTrue(self.remote_host)
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_hosts': self.hostB})
        self.server.manager(MGR_CMD_SET, SERVER, {'acl_host_enable': True})
        self.pbsnodes_cmd = os.path.join(
            self.server.pbs_conf['PBS_EXEC'], 'bin', 'pbsnodes') + ' -av'
        self.qstat_cmd = os.path.join(
            self.server.pbs_conf['PBS_EXEC'], 'bin', 'qstat')

    def test_acl_host_moms_enable(self):
        """
        Set acl_host_moms_enable = True and check whether or not the
        remote host is able run pbsnodes and qstat.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_host_moms_enable': True})
        ret = self.du.run_cmd(self.remote_host, cmd=self.pbsnodes_cmd)
        self.assertEqual(ret['rc'], 0)
        ret = self.du.run_cmd(self.remote_host, cmd=self.qstat_cmd)
        self.assertEqual(ret['rc'], 0)

    def test_acl_host_moms_disable(self):
        """
        Set acl_host_moms_enable = False and check whether or not the
        remote host is forbidden to run pbsnodes and qstat.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_host_moms_enable': False})
        ret = self.du.run_cmd(self.remote_host, cmd=self.pbsnodes_cmd)
        self.assertNotEqual(ret['rc'], 0)
        ret = self.du.run_cmd(self.remote_host, cmd=self.qstat_cmd)
        self.assertNotEqual(ret['rc'], 0)

    def test_acl_host_moms_hooks_and_jobs(self):
        """
        Use hooks to test whether remote host is able to run pbs.server()
        and check whether the job that is submitted goes to the 'R' state.
        """
        hook_name = "hook_acl_host_moms_t"
        hook_body = """
import pbs
e = pbs.event()
svr = pbs.server().server_state
e.accept()
"""
        # Best-effort cleanup of a pre-existing hook with the same name
        try:
            self.server.manager(MGR_CMD_DELETE, HOOK, None, hook_name)
        except Exception:
            pass
        a = {'event': 'execjob_begin', 'enabled': 'True'}
        self.server.create_import_hook(hook_name, a, hook_body,
                                       overwrite=True)
        # With acl_host_moms_enable off, the mom's pbs.server() call in
        # the begin hook is refused and the job ends up held
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_host_moms_enable': False})
        j = Job()
        j.set_sleep_time(10)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'H'}, id=jid)
        # With it on, the hook succeeds and the job runs
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_host_moms_enable': True})
        j = Job()
        j.set_sleep_time(10)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid)

    def test_acl_host_mom_queue_access(self):
        """
        Test that remote host cannot submit jobs to queue where
        acl_host_enable is True and acl_host_moms_enable is set on server,
        but remote host is not added in acl_hosts.
        """
        queue_n = 'tempq'
        queue_params = {'queue_type': 'Execution', 'enabled': 'True',
                        'started': 'True', 'acl_host_enable': 'True'}
        # Use queue_n consistently instead of repeating the literal
        self.server.manager(MGR_CMD_CREATE, QUEUE, queue_params, id=queue_n)
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'acl_host_moms_enable': True})
        # Setting acl_host_enable on queue overrides acl_host_moms_enable
        # on server and requires acl_hosts to include remote host's name.
        self.server.manager(MGR_CMD_SET, SERVER, {'flatuid': True})
        # Setting flatuid lets us submit jobs on server as a remote
        # host without creating a separate user account there.
        j = Job(attrs={ATTR_queue: queue_n})
        j.set_sleep_time(10)
        # Submission must be refused (assertRaises replaces the old
        # cannot_submit flag; the dead qsub_cmd_on_queue local is removed)
        with self.assertRaises(PbsSubmitError):
            self.server.submit(j)
# # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * class Test_acl_host_queue(TestFunctional): """ This test suite is for testing the queue attributes acl_host_enable and acl_hosts. """ def test_acl_host_enable_refuse(self): """ Set acl_host_enable = True on queue and check whether or not the submit is refused. """ a = {"acl_host_enable": True, "acl_hosts": "foo"} self.server.manager(MGR_CMD_SET, QUEUE, a, self.server.default_queue) j = Job(TEST_USER) try: self.server.submit(j) except PbsSubmitError as e: error_msg = "qsub: Access from host not allowed, or unknown host" self.assertEquals(e.msg[0], error_msg) else: self.fail("Queue is violating acl_hosts") def test_acl_host_enable_allow(self): """ Set acl_host_enable = True along with acl_hosts and check whether or not a job can be submitted. """ a = {"acl_host_enable": True, "acl_hosts": self.server.hostname} self.server.manager(MGR_CMD_SET, QUEUE, a, self.server.default_queue) j = Job(TEST_USER) jid = self.server.submit(j) self.logger.info('Job submitted successfully: ' + jid) ================================================ FILE: test/tests/functional/pbs_acl_host_server.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
from tests.functional import *


class Test_acl_host_server(TestFunctional):
    """
    This test suite is for testing the subnets in server's attribute
    acl_hosts. This test requires remote client.
    """

    def setUp(self):
        """
        Determine the server ip and remote host
        """
        TestFunctional.setUp(self)
        usage_string = 'test requires a remote client as input,' + \
            ' use -p client=<client>'
        self.serverip = socket.gethostbyname(self.server.hostname)
        if not self.du.is_localhost(self.server.client):
            self.remote_host = socket.getfqdn(self.server.client)
        else:
            self.skip_test(usage_string)
        self.assertTrue(self.remote_host)
        self.pbsnodes_cmd = os.path.join(
            self.server.pbs_conf['PBS_EXEC'], 'bin',
            'pbsnodes') + ' -av' + ' -s ' + self.server.hostname

    def test_acl_subnet_enable_allow(self):
        """
        Set acl_host_enable = True, subnet to server ip with the mask
        255.255.0.0 or 16 and check whether or not the remote host is
        able to run pbsnodes. It should allow.
        """
        # Both the dotted-quad and the CIDR spelling of the /16 mask
        # must admit the remote host
        for mask in ("255.255.0.0", "16"):
            a = {"acl_host_enable": True,
                 "acl_hosts": self.serverip + "/" + mask}
            self.server.manager(MGR_CMD_SET, SERVER, a)
            ret = self.du.run_cmd(self.remote_host, cmd=self.pbsnodes_cmd)
            self.assertEqual(ret['rc'], 0)

    def test_acl_subnet_enable_refuse(self):
        """
        Set acl_host_enable = True, subnet to server ip with the mask
        255.255.255.255 or 32 and check whether or not the remote host
        is able to run pbsnodes. It should refuse.
        """
        # A host-only (/32) mask must shut the remote host out
        for mask in ("255.255.255.255", "32"):
            a = {"acl_host_enable": True,
                 "acl_hosts": self.serverip + "/" + mask}
            self.server.manager(MGR_CMD_SET, SERVER, a)
            ret = self.du.run_cmd(self.remote_host, cmd=self.pbsnodes_cmd)
            self.assertNotEqual(ret['rc'], 0)

    def tearDown(self):
        """
        Unset the acl attributes so tearDown can process on remote host.
        """
        self.server.manager(MGR_CMD_UNSET, SERVER,
                            ["acl_host_enable", "acl_hosts"])
import time

from tests.functional import *


class TestAdminSuspend(TestFunctional):
    """
    Test the admin-suspend/admin-resume feature for node maintenance
    """
    # NOTE(review): this chunk of the file is cut off inside test_resume;
    # that trailing method is not reproduced here.

    def setUp(self):
        TestFunctional.setUp(self)
        a = {'resources_available.ncpus': 4, 'resources_available.mem': '4gb'}
        self.mom.create_vnodes(a, 1)

    def test_basic(self):
        """
        Test basic admin-suspend functionality
        """
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        j2 = Job(TEST_USER)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2)
        vnode = self.mom.shortname + '[0]'
        # admin-suspend job 1
        self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid1})
        # admin-suspend job 2
        self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid2)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid1 + "," + jid2})
        # admin-resume job 1; the node must stay in state maintenance
        self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid2})
        # admin-resume job 2; the node must return to state free
        self.server.sigjob(jid2, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_basic_ja(self):
        """
        Test basic admin-suspend functionality for job arrays
        """
        jA = Job(TEST_USER)
        jA.set_attributes({'Resource_List.select': '1:ncpus=1',
                           ATTR_J: '1-2'})
        jidA = self.server.submit(jA)
        self.server.expect(JOB, {'job_state': 'B'}, id=jidA)
        subjobs = self.server.status(JOB, id=jidA, extend='t')
        # subjobs[0] is the array itself; we need the subjobs
        jid1 = subjobs[1]['id']
        jid2 = subjobs[2]['id']
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2)
        vnode = self.mom.shortname + '[0]'
        # admin-suspend subjob 1
        self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid1})
        # admin-suspend subjob 2
        self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid2)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid1 + "," + jid2})
        # admin-resume subjob 1; the node must stay in state maintenance
        self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid2})
        # admin-resume subjob 2; the node must return to state free
        self.server.sigjob(jid2, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_basic_restart(self):
        """
        Test basic admin-suspend functionality with server restart.
        The restart will test if the node recovers properly in maintenance
        """
        j1 = Job(TEST_USER)
        jid = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42},
                           attrop=PTL_AND, id=jid)
        vnode = self.mom.shortname + '[0]'
        # admin-suspend the job
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid})
        self.server.restart()
        # The maintenance state must survive the restart
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(NODE, {'maintenance_jobs': jid})
        # Checking licenses to avoid failure at resume since PBS licenses
        # might not be available and as a result resume fails
        rv = self.is_server_licensed(self.server)
        _msg = 'No license found on server %s' % (self.server.shortname)
        self.assertTrue(rv, _msg)
        # admin-resume the job
        self.server.sigjob(jid, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_cmd_perm(self):
        """
        Test permissions on admin-suspend, admin-resume, maintenance_jobs
        and the maintenance node state.
        """
        vnode = self.mom.shortname + '[0]'
        # The maintenance node state must not be settable directly
        try:
            self.server.manager(
                MGR_CMD_SET, NODE, {'state': 'maintenance'},
                id=vnode, runas=ROOT_USER)
        except PbsManagerError as e:
            self.assertTrue('Illegal value for node state' in e.msg[0])
        self.server.expect(NODE, {'state': 'free'}, id=vnode)
        # The 'maintenance_jobs' attribute must not be settable either
        try:
            self.server.manager(
                MGR_CMD_SET, NODE, {'maintenance_jobs': 'foo'},
                id=vnode, runas=ROOT_USER)
        except PbsManagerError as e:
            self.assertTrue(
                'Cannot set attribute, read only or insufficient permission'
                in e.msg[0])
        self.server.expect(NODE, 'maintenance_jobs', op=UNSET, id=vnode)
        # Regular users must not be able to admin-suspend jobs
        j = Job(TEST_USER)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42},
                           attrop=PTL_AND, id=jid)
        try:
            self.server.sigjob(jid, 'admin-suspend', runas=TEST_USER)
        except PbsSignalError as e:
            self.assertTrue('Unauthorized Request' in e.msg[0])
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        # Regular users must not be able to admin-resume jobs
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid)
        try:
            self.server.sigjob(jid, 'admin-resume', runas=TEST_USER)
        except PbsSignalError as e:
            self.assertTrue('Unauthorized Request' in e.msg[0])
        self.server.expect(JOB, {'job_state': 'S'}, id=jid)

    def test_wrong_state1(self):
        """
        Test using wrong resume signal is correctly rejected
        """
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        # Plain suspend, then try the admin-resume counterpart
        self.server.sigjob(jid1, "suspend", runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        try:
            self.server.sigjob(jid1, "admin-resume", runas=ROOT_USER)
        except PbsSignalError as e:
            self.assertTrue(
                'Job can not be resumed with the requested resume signal'
                in e.msg[0])
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)

    def test_wrong_state2(self):
        """
        Test using wrong resume signal is correctly rejected
        """
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        # Admin-suspend, then try the plain resume counterpart
        self.server.sigjob(jid1, "admin-suspend", runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        self.server.expect(JOB, {'substate': 43}, id=jid1)
        try:
            self.server.sigjob(jid1, "resume", runas=ROOT_USER)
        except PbsSignalError as e:
            self.assertTrue(
                'Job can not be resumed with the requested resume signal'
                in e.msg[0])
        # If resume had worked, the job would be in substate 45
        self.server.expect(JOB, {'substate': 43}, id=jid1)

    def test_deljob(self):
        """
        Test whether a node leaves the maintenance state when an
        admin-suspended job is deleted
        """
        j = Job(TEST_USER)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        vnode = self.mom.shortname + '[0]'
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.deljob(jid, wait=True)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_deljob_force(self):
        """
        Test whether a node leaves the maintenance state when an
        admin-suspended job is deleted with -Wforce
        """
        j = Job(TEST_USER)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        vnode = self.mom.shortname + '[0]'
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.deljob(jid, extend='force', wait=True)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_rerunjob(self):
        """
        Test whether a node leaves the maintenance state when an
        admin-suspended job is requeued
        """
        j = Job(TEST_USER)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        vnode = self.mom.shortname + '[0]'
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.rerunjob(jid, extend='force')
        # Job eventually goes to R state after being requeued for short time
        self.server.expect(JOB, {'job_state': 'R'}, id=jid)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)

    def test_multivnode(self):
        """
        Submit a job to multiple vnodes. Send an admin-suspend signal
        and see all nodes go into maintenance
        """
        a = {'resources_available.ncpus': 4, 'resources_available.mem': '4gb'}
        self.mom.create_vnodes(a, 3, usenatvnode=True)
        j = Job(TEST_USER)
        j.set_attributes({'Resource_List.select': '3:ncpus=1',
                          'Resource_List.place': 'vscatter'})
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state=maintenance': 3})
        self.server.expect(JOB, {'job_state': 'S'}, id=jid)
        self.server.sigjob(jid, 'admin-resume', runas=ROOT_USER)
        self.server.expect(NODE, {'state=free': 3})

    def test_multivnode2(self):
        """
        Submit a job to multiple vnodes. Send an admin-suspend signal
        and see all nodes go into maintenance. Submit a single node job
        to one of the nodes. Resume the multinode job and see the single
        node job's node still in maintenance
        """
        a = {'resources_available.ncpus': 4, 'resources_available.mem': '4gb'}
        self.mom.create_vnodes(a, 3, usenatvnode=True)
        # Submit multinode job 1
        j1 = Job(TEST_USER)
        j1.set_attributes({'Resource_List.select': '3:ncpus=1',
                           'Resource_List.place': 'vscatter'})
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        vnode = self.mom.shortname + '[0]'
        # Submit job 2 to a specific node
        j2 = Job(TEST_USER)
        j2.set_attributes(
            {'Resource_List.select': '1:ncpus=1:vnode=' + vnode})
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2)
        # admin-suspend job 1 and see all three nodes go into maintenance
        self.server.sigjob(jid1, 'admin-suspend')
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        self.server.expect(NODE, {'state=maintenance': 3})
        # admin-suspend job 2
        self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid2)
        # admin-resume job 1 and see one node stay in maintenance
        self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER)
        self.server.expect(NODE, {'state=free': 2})
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)

    def test_multivnode_excl(self):
        """
        Submit an excl job to multiple vnodes. Send an admin-suspend
        signal and see all nodes go into maintenance
        """
        a = {'resources_available.ncpus': 4, 'resources_available.mem': '4gb'}
        self.mom.create_vnodes(a, 3, usenatvnode=True)
        j = Job(TEST_USER)
        j.set_attributes({'Resource_List.select': '3:ncpus=1',
                          'Resource_List.place': 'vscatter:excl'})
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        self.server.expect(NODE, {'state=job-exclusive': 3})
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state=maintenance': 3})
        self.server.expect(JOB, {'job_state': 'S'}, id=jid)
        self.server.sigjob(jid, 'admin-resume', runas=ROOT_USER)
        self.server.expect(NODE, {'state=job-exclusive': 3})

    def test_degraded_resv(self):
        """
        Test if a reservation goes into the degraded state after
        its node is put into maintenance
        """
        # Submit a reservation and see it confirmed
        r = Reservation(TEST_USER)
        r.set_attributes({'Resource_List.select': '1:ncpus=1',
                          'reserve_start': time.time() + 3600,
                          'reserve_end': time.time() + 7200})
        rid = self.server.submit(r)
        a = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')}
        self.server.expect(RESV, a, rid)
        # Submit a job and see it run
        j = Job(TEST_USER)
        j.set_attributes({'Resource_List.select': '1:ncpus=1',
                          'Resource_List.walltime': 120})
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid)
        vnode = self.mom.shortname + '[0]'
        # admin-suspend the job
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        # See the reservation in degraded state
        a = {'reserve_state': (MATCH_RE, 'RESV_DEGRADED|10')}
        self.server.expect(RESV, a, rid)

    def test_resv_jobend(self):
        """
        Test if a node goes back to free state when reservation ends
        and admin-suspended job is killed
        """
        # Submit a reservation and see it confirmed
        r = Reservation(TEST_USER)
        r.set_attributes({'Resource_List.select': '1:ncpus=1',
                          'reserve_start': time.time() + 30,
                          'reserve_end': time.time() + 60})
        rid = self.server.submit(r)
        a = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')}
        self.server.expect(RESV, a, id=rid)
        # Submit a job into the reservation's queue
        j = Job(TEST_USER)
        rque = rid.split(".")
        j.set_attributes({'queue': rque[0]})
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid)
        # Wait for the reservation to start
        a = {'reserve_state': (MATCH_RE, 'RESV_RUNNING|3')}
        self.server.expect(RESV, a, rid, offset=30)
        # The job is running as well
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42},
                           id=jid, max_attempts=30)
        vnode = self.mom.shortname + '[0]'
        # admin-suspend the job
        self.server.sigjob(jid, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        # Submit another job outside of the reservation
        j = Job(TEST_USER)
        jid2 = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid2)
        # When the reservation ends the job gets deleted and the node
        # state goes back to free
        self.server.expect(JOB, 'queue', op=UNSET, id=jid, offset=120)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)
        # job2 starts running
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2,
                           max_attempts=60)

    def test_que(self):
        """
        Test to check that job gets suspended on non-default queue
        """
        # create a high priority workq2 and a routeq
        a = {'queue_type': 'execution', 'started': 't', 'enabled': 't',
             'priority': 150}
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, id='workq2')
        a = {'queue_type': 'route', 'started': 't', 'enabled': 't',
             'route_destinations': 'workq2'}
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, id='route')
        # submit a normal job
        j = Job(TEST_USER)
        j.set_attributes({'Resource_List.select': '1:ncpus=3'})
        jid1 = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1)
        # submit a high priority job; make sure job1 is suspended
        j = Job(TEST_USER)
        j.set_attributes({'Resource_List.select': '1:ncpus=3',
                          'queue': 'route'})
        jid2 = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid1)
        # The scheduler suspension above must not put the node into
        # maintenance
        vnode = self.mom.shortname + '[0]'
        self.server.expect(
            NODE, {'state': (MATCH_RE, 'free|job-exclusive')}, id=vnode)
        # admin-suspend job2
        self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        self.server.expect(JOB, {'job_state=S': 2})
        # Releasing job1 will fail and not change node state
        rv = self.server.sigjob(jid1, 'resume', runas=ROOT_USER,
                                logerr='True')
        self.assertFalse(rv)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        # deleting job1 will not change node state either
        self.server.deljob(jid1, wait=True)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vnode)
        # admin-resume job2
        self.server.sigjob(jid2, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2)
        self.server.expect(NODE, {'state': 'free'}, id=vnode)
        # plain suspend leaves the node out of maintenance
        self.server.sigjob(jid2, 'suspend', runas=ROOT_USER)
        self.server.expect(JOB, {'job_state': 'S'}, id=jid2)
        self.server.expect(
            NODE, {'state': (MATCH_RE, 'free|job-exclusive')}, id=vnode)
nodes to maintenance state self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER) self.server.expect(NODE, {'state=maintenance': 3}) self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER) self.server.expect(JOB, {'job_state=S': 2}) self.server.expect(JOB, {'job_state': 'R'}, id=jid3) # submit a new job and it will be queued j = Job(TEST_USER) jid4 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'Q'}, id=jid4) # List all maintenance_jobs self.server.expect(NODE, {'maintenance_jobs': jid1 + "," + jid2}) # resume 1 job that will not change node state self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER) self.server.expect(NODE, {'state=maintenance': 3}) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1) self.server.expect(JOB, {'job_state': 'S'}, id=jid2) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid3) # resume the remaining job self.server.sigjob(jid2, 'admin-resume', runas=ROOT_USER) self.server.expect(NODE, {'state=free': 3}) self.server.expect(JOB, {'job_state=R': 4}) def test_admin_resume_loop(self): """ Test that running admin-resume in a loop will have no impact on PBS """ # submit a job j = Job(TEST_USER) j.set_sleep_time(300) jid1 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1) vnode = self.mom.shortname + '[0]' # admin suspend and resume job in a loop for x in range(15): self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER) self.server.expect(JOB, {'job_state': 'S'}, id=jid1) self.server.expect(NODE, {'state': 'maintenance'}, id=vnode) # sleep for sometime time.sleep(3) # resume the job self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) self.server.expect(NODE, {'state': 'free'}, id=vnode) def test_custom_res(self): """ Test that job will not run on a node in maintenance state if explicitly asking for a resource on that node """ # create multiple vnodes a = {'resources_available.ncpus': 
4, 'resources_available.mem': '4gb'} self.mom.create_vnodes(a, 3, usenatvnode=True) # create a node level resource self.server.manager( MGR_CMD_CREATE, RSC, {'type': 'float', 'flag': 'nh'}, id="foo", runas=ROOT_USER) vnode = self.mom.shortname + '[1]' # set foo on vn[1] self.server.manager( MGR_CMD_SET, NODE, {'resources_available.foo': 5}, id=vnode, runas=ROOT_USER) # set foo in sched_config self.scheduler.add_resource('foo') # submit a few jobs j = Job(TEST_USER) j.set_attributes({'Resource_List.select': 'vnode=' + vnode}) jid1 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1) # admin suspend the job to put the node to maintenance self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER) self.server.expect(JOB, {'job_state': 'S'}, id=jid1) self.server.expect(NODE, {'state': 'maintenance'}, id=vnode) # submit other jobs asking for specific resources on vn[1] j = Job(TEST_USER) j.set_attributes({'Resource_List.foo': '2'}) jid2 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'Q'}, id=jid2) # submit more jobs. 
They should be running j = Job(TEST_USER) jid3 = self.server.submit(j) jid4 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid3) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid4) # verify that vn[1] is still in maintenance and # job3 and job4 not running on vn[1] self.server.expect(NODE, {'state': 'maintenance'}, id=vnode) try: self.server.expect(JOB, {'exec_vnode': (MATCH_RE, vnode)}, id=jid3, max_attempts=20) self.server.expect(JOB, {'exec_vnode': (MATCH_RE, vnode)}, id=jid4, max_attempts=20) except Exception as e: self.assertFalse(e.rv) msg = "jid3 and jid4 not running on " + vnode + " as expected" self.logger.info(msg) def test_list_jobs_1(self): """ Test to list and set maintenance_jobs as various users """ # This test is run with CLI mode only _m = self.server.get_op_mode() if _m != PTL_CLI: self.skipTest("Not all commands can be run with API mode") # submit a few jobs j = Job(TEST_USER) jid1 = self.server.submit(j) jid2 = self.server.submit(j) jid3 = self.server.submit(j) # verify that all are running self.server.expect(JOB, {'job_state=R': 3, 'substate=42': 3}) # admin-suspend 2 of them self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER) self.server.sigjob(jid3, 'admin-suspend', runas=ROOT_USER) vnode = self.mom.shortname + '[0]' # node state is in maintenance self.server.expect(NODE, {'state': 'maintenance'}, id=vnode) # list maintenance_jobs as root self.server.expect(NODE, {'maintenance_jobs': jid2 + "," + jid3}, runas=ROOT_USER) # list maintenance jobs as user self.server.expect(NODE, {'maintenance_jobs': jid2 + "," + jid3}, runas=TEST_USER) # set an operator self.server.manager(MGR_CMD_SET, SERVER, {'operators': 'pbsoper@*'}) # List all jobs in maintenance mode as operator self.server.expect( NODE, {'maintenance_jobs': jid2 + "," + jid3}, runas='pbsoper') # set maintenance_jobs as root try: self.server.manager(MGR_CMD_SET, NODE, {'maintenance_jobs': jid1}, id=vnode, runas=ROOT_USER) 
except PbsManagerError as e: self.assertFalse(e.rv) msg = "Cannot set attribute, read only" +\ " or insufficient permission maintenance_jobs" self.assertTrue(msg in e.msg[0]) # Set maintenance_jobs as operator try: self.server.manager(MGR_CMD_SET, NODE, {'maintenance_jobs': jid1}, id=vnode, runas='pbsoper') except PbsManagerError as e: self.assertFalse(e.rv) msg = "Cannot set attribute, read only" +\ " or insufficient permission maintenance_jobs" self.assertTrue(msg in e.msg[0]) # Set maintenance_jobs as user try: self.server.manager(MGR_CMD_SET, NODE, {'maintenance_jobs': jid1}, id=vnode, runas=TEST_USER) except PbsManagerError as e: self.assertFalse(e.rv) self.assertTrue("Unauthorized Request" in e.msg[0]) def test_list_jobs_2(self): """ Test to list maintenance_jobs when no job is admin-suspended """ # Submit a few jobs j = Job(TEST_USER) jid1 = self.server.submit(j) jid2 = self.server.submit(j) jid3 = self.server.submit(j) # verify that all are running self.server.expect(JOB, {'job_state=R': 3, 'substate=42': 3}) vnode = self.mom.shortname + '[0]' # list maintenance_jobs. 
It should be empty self.server.expect(NODE, 'maintenance_jobs', op=UNSET, id=vnode) # Regular suspend a job self.server.sigjob(jid2, 'suspend', runas=ROOT_USER) # List maintenance_jobs again self.server.expect(NODE, 'maintenance_jobs', op=UNSET, id=vnode) def test_preempt_order(self): """ Test that scheduler preempt_order has no impact on admin-suspend """ # create a high priority queue a = {'queue_type': 'e', 'enabled': 't', 'started': 't', 'priority': 150} self.server.manager(MGR_CMD_CREATE, QUEUE, a, id="highp") # set preempt_order to R self.server.manager(MGR_CMD_SET, SCHED, {'preempt_order': 'R'}, runas=ROOT_USER) vnode = self.mom.shortname + '[0]' # submit a job j = Job(TEST_USER) j.set_attributes({'Resource_List.select': 'vnode=' + vnode}) jid1 = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid1) # submit a high priority job j = Job(TEST_USER) j.set_attributes({'queue': 'highp', 'Resource_List.select': '1:ncpus=4:vnode=' + vnode}) jid2 = self.server.submit(j) # job2 is running and job1 is requeued self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid1) # admin-suspend job1. It will fail try: self.server.sigjob(jid1, 'admin-suspend', logerr=False) except Exception as e: self.assertFalse(e.rv) # admin suspend job2 self.server.sigjob(jid2, 'admin-suspend') self.server.expect(JOB, {'job_state': 'S'}, id=jid2) self.server.expect(NODE, {'state': 'maintenance'}, id=vnode) # admin-resume job2. node state will become job-busy. 
self.server.sigjob(jid2, 'admin-resume') self.server.expect(NODE, {'state': 'job-busy'}, id=vnode) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid1) def test_hook(self): """ List maintenance_jobs via hook """ # Create and import a hook hook_name = "test" hook_body = """ import pbs vn = pbs.server().vnode('vn[0]') pbs.logmsg(pbs.LOG_DEBUG,\ "list of maintenance_jobs are %s" % vn.maintenance_jobs) """ a = {'resources_available.ncpus': 4, 'resources_available.mem': '4gb'} self.mom.create_vnodes(a, 1, vname='vn') a = {'event': 'exechost_periodic', 'enabled': 'True', 'freq': 5} self.server.create_import_hook(hook_name, a, hook_body) # submit few jobs j = Job(TEST_USER) jid1 = self.server.submit(j) jid2 = self.server.submit(j) self.server.expect(JOB, {'job_state=R': 2}) # wait for the periodic hook time.sleep(5) # look for the log message self.mom.log_match("list of maintenance_jobs are None") # admin-suspend jobs self.server.sigjob(jid1, 'admin-suspend') self.server.sigjob(jid2, 'admin-suspend') # wait for periodic hook and check mom_log time.sleep(5) self.mom.log_match("list of maintenance_jobs are %s" % ((jid1 + "," + jid2),)) # admin-resume job1 self.server.sigjob(jid1, 'admin-resume') # wait for periodic hook and check mom_log time.sleep(5) self.mom.log_match( "list of maintenance_jobs are %s" % (jid2,)) def test_offline(self): """ Test that if a node is put to offline and removed from maintenance state it remains offlined """ # submit a job and admin-suspend it j1 = Job(TEST_USER) jid1 = self.server.submit(j1) j2 = Job(TEST_USER) jid2 = self.server.submit(j2) self.server.expect(JOB, {'job_state': "R", 'substate': 42}, id=jid1) self.server.expect(JOB, {'job_state': "R", 'substate': 42}, id=jid2) self.server.sigjob(jid1, 'admin-suspend') self.server.sigjob(jid2, 'admin-suspend') vnode = self.mom.shortname + '[0]' # node state is in maintenance self.server.expect(NODE, {'state': 'maintenance'}, 
id=vnode) # submit another job. It will be queued j3 = Job(TEST_USER) jid3 = self.server.submit(j3) self.server.expect(JOB, {'job_state': 'Q'}, id=jid3) # mark the node as offline too self.server.manager(MGR_CMD_SET, NODE, {'state': 'offline'}, id=vnode) # delete job1 as user and resume job2 self.server.deljob(jid1, wait=True, runas=TEST_USER) self.server.sigjob(jid2, 'admin-resume') # verify that node state is offline and # job3 is still queued self.server.expect(NODE, {'state': 'offline'}, id=vnode) self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid3) ================================================ FILE: test/tests/functional/pbs_allpart.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * class TestSchedAllPart(TestFunctional): """ Test the scheduler's allpart optimization """ def setUp(self): TestFunctional.setUp(self) a = {'resources_available.ncpus': 1, 'resources_available.mem': '1gb'} self.mom.create_vnodes(a, 2, usenatvnode=True) def test_free_nodes(self): """ Test that if there aren't enough free nodes available, it is reported """ self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) a = {'Resource_List.select': '2:ncpus=1'} j1 = Job(TEST_USER, a) jid1 = self.server.submit(j1) j2 = Job(TEST_USER, a) jid2 = self.server.submit(j2) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) a = {'job_state': 'Q', 'comment': 'Not Running: Not enough free nodes available'} self.server.expect(JOB, a, id=jid2) def test_vscatter(self): """ Test that we determine we can't run a job when there aren't enough free nodes available due to vscatter """ self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) a = {'Resource_List.select': '1:ncpus=1'} j1 = Job(TEST_USER, a) jid1 = self.server.submit(j1) a = {'Resource_List.select': '2:ncpus=1', 'Resource_List.place': 'vscatter'} j2 = Job(TEST_USER, a) jid2 = self.server.submit(j2) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) a = {'job_state': 'Q', 'comment': 'Not Running: Not enough free nodes available'} self.server.expect(JOB, a, id=jid2) def test_vscatter2(self): """ Test that we can 
determine a job can never run if it is requesting more nodes than is in the complex via vscatter """ self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.place': 'vscatter'} j = Job(TEST_USER, a) jid = self.server.submit(j) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) a = {'job_state': 'Q', 'comment': 'Can Never Run: Not enough total nodes available'} self.server.expect(JOB, a, id=jid) def test_rassn(self): """ Test rassn resource (ncpus) is unavailable and the comment is shown with a RAT line """ self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) a = {'Resource_List.select': '1:ncpus=1'} j1 = Job(TEST_USER, a) jid1 = self.server.submit(j1) a = {'Resource_List.select': '2:ncpus=1'} j2 = Job(TEST_USER, a) jid2 = self.server.submit(j2) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'}) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) m = 'Not Running: Insufficient amount of resource: ncpus ' + \ '(R: 2 A: 1 T: 2)' a = {'job_state': 'Q', 'comment': m} self.server.expect(JOB, a, id=jid2) def test_nonexistent_non_consumable(self): """ Test that a nonexistent non-consumable value is caught as 'Never Run' """ a = {'Resource_List.select': '1:ncpus=1:vnode=foo'} j = Job(TEST_USER, a) jid = self.server.submit(j) m = r'Can Never Run: Insufficient amount of resource: vnode \(foo !=' a = {'job_state': 'Q', 'comment': (MATCH_RE, m)} self.server.expect(JOB, a, id=jid) def test_too_many_ncpus(self): """ test that a job is marked as can never run if it requests more cpus than are available on the entire complex """ a = {'Resource_List.select': '3:ncpus=1'} j = Job(TEST_USER, a) jid = self.server.submit(j) m = 'Can Never Run: Insufficient amount of resource: ncpus ' + \ '(R: 3 A: 2 T: 2)' a = {'job_state': 'Q', 'comment': m} self.server.expect(JOB, a, id=jid) ================================================ FILE: 
test/tests/functional/pbs_alps_inventory_check_hook.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. import os from tests.functional import * @tags('cray', 'mom') class TestAlpsInventoryCheckHook(TestFunctional): """ PBS mom appears not to periodically automatically re-query the node inventory on Cray. 
""" def setUp(self): self.platform = DshUtils().get_platform() if self.platform != 'cray' and self.platform != 'craysim': self.skipTest("This is not a cray platform") TestFunctional.setUp(self) with open("/etc/xthostname") as xthost_file: self.crayhostname = xthost_file.readline().rstrip() self.server.manager(MGR_CMD_SET, PBS_HOOK, {'enabled': 'true', 'freq': 3}, id='PBS_alps_inventory_check') def delete_cray_compute_node(self): """ Deletes the cray compute node from pbs node list """ vnl = self.server.filter( VNODE, {'resources_available.vntype': 'cray_compute'}) vlist = vnl["resources_available.vntype=cray_compute"] self.server.manager(MGR_CMD_DELETE, NODE, id=vlist[0]) def test_apstat_cmd(self): """ Test the log when apstat is not present in the expected/default location, it indicates a Cray system issue. """ now = time.time() if self.platform == "craysim": if os.path.exists("/opt/cray/alps/default/bin/stat"): # The file to be renamed is conflicting with existing file self.skipTest("Conflict in the testcase settings") os.rename( "/opt/cray/alps/default/bin/apstat", "/opt/cray/alps/default/bin/stat") try: self.mom.log_match( "ALPS Inventory Check: apstat command can not " + "be found at /opt/cray/alps/default/bin/apstat", starttime=now, max_attempts=10, interval=2) finally: os.rename( "/opt/cray/alps/default/bin/stat", "/opt/cray/alps/default/bin/apstat") else: self.skipTest("This test can be run on a simulator") def test_xthostname(self): """ Test when hook attempts to read the /etc/xthostname file to determine Cray hostname, but the hostname file is missing. 
""" now = time.time() if self.platform == "craysim": if os.path.exists("/etc/xt"): # The file to be renamed is conflicting with existing file self.skipTest("Conflict in the testcase settings") os.rename("/etc/xthostname", "/etc/xt") try: self.mom.log_match( "/etc/xthostname file found on this host", starttime=now, max_attempts=10, interval=2) finally: os.rename("/etc/xt", "/etc/xthostname") else: self.skipTest("This test can be run on a simulator") def test_start_of_hook(self): """ Test log at the start of hook processing. """ now = time.time() self.mom.log_match( "Processing ALPS inventory for crayhost %s" % self.crayhostname, starttime=now, max_attempts=10, interval=2) def test_cray_login_nodes(self): """ Test log when no nodes with vntype 'cray_login' are present. """ now = time.time() mc = self.mom.parse_config() save = mc["$alps_client"] del mc["$alps_client"] self.mom.apply_config(mc) self.host = self.mom.shortname try: self.server.manager(MGR_CMD_DELETE, NODE, None, "") self.server.manager(MGR_CMD_CREATE, NODE, id=self.host) self.mom.log_match( "ALPS Inventory Check: No eligible " + "login nodes to perform inventory check", starttime=now, max_attempts=10, interval=2) finally: mc["$alps_client"] = save self.mom.apply_config(mc, False) def test_pbs_home_path(self): """ Test log when mom_priv directory is not in the expected/default location (PBS_HOME), indicating a PBS installation issue. 
""" if self.platform == "craysim": now = time.time() pbs_conf = self.du.parse_pbs_config(self.server.shortname) save = pbs_conf['PBS_HOME'] self.du.set_pbs_config( self.server.shortname, confs={ 'PBS_HOME': ''}) try: self.delete_cray_compute_node() self.mom.log_match( "ALPS Inventory Check: Internal error in retrieving " + "path to mom_priv", starttime=now, max_attempts=10, interval=2) finally: self.du.set_pbs_config( self.server.shortname, confs={ 'PBS_HOME': save}) else: self.skipTest("This test can be run on a simulator") def test_alps_and_pbs_are_in_sync(self): """ Test log when both PBS and ALPS are in sync i.e. they report the same number of compute nodes in the Cray cluster. """ now = time.time() self.mom.log_match( "ALPS Inventory Check: PBS and ALPS are in sync", starttime=now, max_attempts=10, interval=2) def test_nodes_out_of_sync(self): """ Test the log when PBS and ALPS are out of sync """ now = time.time() self.delete_cray_compute_node() self.mom.log_match( "ALPS Inventory Check: Compute " + "nodes defined in ALPS, but not in PBS", starttime=now, max_attempts=10, interval=2) def test_failure_in_refreshing_nodes(self): """ Test log when the Hook is unable to HUP the Mom and successfully refresh nodes. 
""" if self.platform == "craysim": now = time.time() pbs_conf = self.du.parse_pbs_config(self.server.shortname) save = pbs_conf['PBS_HOME'] self.du.set_pbs_config( self.server.shortname, confs={'PBS_HOME': 'xyz'}) try: self.delete_cray_compute_node() self.mom.log_match( "ALPS Inventory Check: Failure in refreshing nodes on " + "login node (%s)" % self.mom.hostname, starttime=now, max_attempts=10, interval=2) finally: self.du.set_pbs_config( self.server.shortname, confs={ 'PBS_HOME': save}) else: self.skipTest("This test can be run on cray a simulator") ================================================ FILE: test/tests/functional/pbs_alps_release_tunables.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

from tests.functional import *
import math
from ptl.utils.pbs_logutils import PBSLogUtils


@tags('cray')
class TestCrayAlpsReleaseTunables(TestFunctional):

    """
    Set of tests to verify alps release tunables namely
    alps_release_wait_time and alps_release_jitter
    """

    def setUp(self):
        machine = self.du.get_platform()
        if not machine == 'cray':
            self.skipTest("Test suite only meant to run on a Cray")
        TestFunctional.setUp(self)

    @staticmethod
    def get_epoch(msg):
        """Return the epoch timestamp of a PBS log line."""
        # Since its a log message split on ';' to get timestamp
        a = PBSLogUtils.convert_date_time(msg.split(';')[0])
        return a

    def test_alps_release_wait_time(self):
        """
        Set alps_release_wait_time to a higher value and then notice that
        subsequest reservation cancellation requests are made at least
        after the set interval.
        """
        # assigning a random value to alps_release_wait_time that is
        # measurable using mom log messages
        arwt = 4.298
        self.mom.add_config({'$alps_release_wait_time': arwt})
        # submit a job and then delete it after it starts running
        start_time = time.time()
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        time.sleep(2)
        self.server.delete(jid1)
        # Look for a message that confirms that reservation is deleted
        self.mom.log_match("%s;ALPS reservation cancelled" % jid1,
                           starttime=start_time)
        # Now that we know that reservation is cleared we should
        # check for time difference between each cancellation request
        out = self.mom.log_match("%s;Canceling ALPS reservation *" % jid1,
                                 n='ALL', regexp=True, allmatch=True)
        # We found something, Let's first check there are atleast 2 such
        # log messages, If not then that means reservation was cancelled
        # in the first attempt itself, at that point right thing to do is
        # to either run it again or find out a way to delay the reservation
        # cancellation at ALPS level itself.
        if len(out) >= 2:
            # variable 'out' is a list of tuples and every second element
            # in a tuple is the matched log message
            time_prev = self.get_epoch(out[0][1])
            for data in out[1:]:
                time_current = self.get_epoch(data[1])
                fail_msg = "alps_release_wait_time not working"
                # Consecutive cancel attempts must be spaced by at least
                # the configured wait time (floored: log timestamps are
                # whole seconds)
                self.assertGreaterEqual(time_current - time_prev,
                                        math.floor(arwt),
                                        msg=fail_msg)
                time_prev = time_current
        else:
            self.skipTest("Reservation cancelled without retry, Try again!")

    def test_alps_release_jitter(self):
        """
        Set alps_release_jitter to a higher value and then notice that
        subsequest reservation cancellation requests are made by adding
        a random time interval (less than jitter) to
        alps_release_wait_time.
        """
        # assigning a random value to alps_release_jitter that is
        # measurable using mom log messages
        arj = 2.198
        arwt = 1
        # upper bound for the gap between two cancel attempts:
        # wait time plus the (ceiled) jitter
        max_delay = (arwt + math.ceil(arj))
        self.mom.add_config({'$alps_release_jitter': arj})
        self.mom.add_config({'$alps_release_wait_time': arwt})
        # There is no good way to test jitter and it is a random number
        # less than value set in alps_release_jitter. So in this case
        # we can probably try deleting a reservation a few times.
        n = retry = 5
        for _ in range(n):
            # submit a job and then delete it after it starts running
            start_time = time.time()
            j1 = Job(TEST_USER)
            jid1 = self.server.submit(j1)
            self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
            time.sleep(2)
            self.server.delete(jid1)
            # Look for a message that confirms that reservation is deleted
            self.mom.log_match("%s;ALPS reservation cancelled" % jid1,
                               starttime=start_time)
            # Now that we know that reservation is cleared we should
            # check for time difference between each cancellation request
            out = self.mom.log_match("%s;Canceling ALPS reservation *" % jid1,
                                     n='ALL', regexp=True, allmatch=True)
            # We found something, Let's first check there are atleast 2 such
            # log messages, If not then that means reservation was cancelled
            # in the first attempt itself, at that point right thing to do is
            # to either run it again or find out a way to delay the
            # reservation cancellation at ALPS level itself.
            if len(out) >= 2:
                # NOTE(review): 'retry' only counts iterations that saw a
                # real retry; it never short-circuits the loop — confirm
                # this is intended
                retry -= 1
                # variable 'out' is a list of tuples and every second element
                # in a tuple is the matched log message
                time_prev = self.get_epoch(out[0][1])
                for data in out[1:]:
                    time_current = self.get_epoch(data[1])
                    self.assertLessEqual(time_current - time_prev, max_delay,
                                         msg="alps_release_jitter not working")
                    time_prev = time_current
        # retry still 5 means no iteration ever observed a second cancel
        # attempt, so jitter could not be measured at all
        if retry == 5:
            self.skipTest("Reservation cancelled without retry, Try again!")


================================================
FILE: test/tests/functional/pbs_array_job_mail.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * import os class Test_array_job_email(TestFunctional): """ This test suite is for testing arrayjob e-mailing (parent job and subjob) """ def test_emails(self): """ Run arrayjob with -m jabe and test if the e-mails are received """ self.server.manager(MGR_CMD_SET, SERVER, {'job_history_enable': 'true'}) mailfile = os.path.join("/var/mail", str(TEST_USER)) if not os.path.isfile(mailfile): self.skip_test("Mail file '%s' does not exist or " "mail is not setup. " "Hence this step would be skipped. " "Please check manually." 
% mailfile) J = Job(TEST_USER, attrs={ATTR_m: 'jabe', ATTR_J: '1-2'}) J.set_sleep_time(1) parent_jid = self.server.submit(J) self.server.expect(JOB, {'job_state': 'F'}, parent_jid, extend='x', max_attempts=15, interval=2) subjob_jid = parent_jid.replace("[]", "[1]") emails = [("PBS Job Id: " + parent_jid, "Begun execution"), ("PBS Job Id: " + parent_jid, "Execution terminated"), ("PBS Job Id: " + subjob_jid, "Begun execution"), ("PBS Job Id: " + subjob_jid, "Execution terminated")] for (jobid, msg) in emails: emailpass = 0 for j in range(5): time.sleep(5) ret = self.du.tail(filename=mailfile, sudo=True, option="-n 600") maillog = [x.strip() for x in ret['out']] for i in range(0, len(maillog) - 2): if jobid == maillog[i] and msg == maillog[i + 2]: emailpass = 1 break if emailpass: break self.assertTrue(emailpass, "Message '" + jobid + " " + msg + "' not found in " + mailfile) def test_qsub_errors_j_mailpoint(self): """ Try to submit 'qsub -m j' and test possible errors """ J = Job(TEST_USER, attrs={ATTR_m: 'j'}) error_msg = "mail option 'j' can not be used without array job" try: self.server.submit(J) except PbsSubmitError as e: self.assertTrue(error_msg in e.msg[0]) J = Job(TEST_USER, attrs={ATTR_m: 'j', ATTR_J: '1-2'}) error_msg = "illegal -m value" try: self.server.submit(J) except PbsSubmitError as e: self.assertTrue(error_msg in e.msg[0]) def test_email_non_existent_user(self): """ Verify when a job array is submitted with a valid and invalid mail recipients and all file stageout attempts fails then email should get delivered to valid recipient and no email would be sent to invalid recipient. 
""" non_existent_user = PbsAttribute.random_str(length=5) non_existent_mailfile = os.path.join(os.sep, "var", "mail", non_existent_user) pbsuser_mailfile = os.path.join(os.sep, "var", "mail", str(TEST_USER)) # Check mail file should exist for existent user if not os.path.isfile(pbsuser_mailfile): msg = "Skipping this test as Mail file '%s' " % pbsuser_mailfile msg += "does not exist or mail is not setup." self.skip_test(msg) # Check non existent user mail file should not exist self.assertFalse(os.path.isfile(non_existent_mailfile)) src_file = PbsAttribute.random_str(length=5) stageout_path = os.path.join(os.sep, '1', src_file) dest_file = stageout_path + '1' if not os.path.isdir(stageout_path) and os.path.exists(src_file): os.remove(src_file) # Submit job with invalid stageout path usermail_list = str(TEST_USER) + "," + non_existent_user set_attrib = {ATTR_stageout: stageout_path + '@' + self.mom.shortname + ':' + dest_file, ATTR_M: usermail_list, ATTR_J: '1-2', ATTR_S: '/bin/bash'} j = Job() j.set_attributes(set_attrib) j.set_sleep_time(1) jid = self.server.submit(j) subjid = j.create_subjob_id(jid, 1) self.server.expect(JOB, 'queue', op=UNSET, id=jid) # Check stageout file should not be present self.assertFalse(os.path.exists(dest_file)) exp_msg = "PBS Job Id: " + subjid err_msg = "%s msg not found in pbsuser's mail log" % exp_msg email_pass = 0 for i in range(5): time.sleep(5) # Check if mail is deliverd to valid user mail file ret = self.du.tail(filename=pbsuser_mailfile, runas=TEST_USER, option="-n 50") maillog = [x.strip() for x in ret['out']] if exp_msg in maillog: email_pass = 1 break self.assertTrue(email_pass, err_msg) # Verify there should not be any email for invalid user self.assertFalse(os.path.isfile(non_existent_mailfile)) ================================================ FILE: test/tests/functional/pbs_basil_parser_err.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. 
# For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * @tags('cray', 'mom') class TestBasilParserErrors(TestFunctional): """ Test the BASIL parser error messages """ def setUp(self): TestFunctional.setUp(self) momA = self.moms.values()[0] if not momA.is_cray(): self.skipTest("%s: not a cray mom." 
% (momA.shortname)) def test_basil_errors(self): """ Check for the non existence of BASIL errors in mom logs """ self.mom.log_match("PERMANENT BASIL error from SYNTAX", max_attempts=10, interval=1, existence=False) self.mom.log_match("Error in BASIL response", max_attempts=10, interval=1, existence=False) ================================================ FILE: test/tests/functional/pbs_basil_support.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. 
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

from tests.functional import *
from string import Template
import os
import defusedxml.ElementTree as ET


@tags('cray', 'mom')
class TestBasilQuery(TestFunctional):
    """
    This test suite is for testing the support for BASIL 1.7/1.4
    basil query.Test if query is made with correct BASIL version,
    and that vnodes are getting created as per the query response.
    """
    # BASIL protocol versions to probe, newest first.
    basil_version = ['1.7', '1.4', '1.3']
    # Highest BASIL version the platform answered SUCCESS for (set in setUp).
    available_version = ""

    @staticmethod
    def init_inventory_node():
        """
        Return a fresh vnode-attribute dict with every expected key
        initialized to the empty string (comp_node() skips empty values).
        """
        node = {}
        node['vnode'] = ""
        node['arch'] = ""
        node['current_aoe'] = ""
        node['host'] = ""
        node['hbmem'] = ""
        node['mem'] = ""
        node['ncpus'] = ""
        node['PBScrayhost'] = ""
        node['PBScraynid'] = ""
        node['vntype'] = ""
        node['accelerator_memory'] = ""
        node['accelerator_model'] = ""
        node['naccelerators'] = ""
        return node

    def reset_nodes(self, hostA):
        """
        Delete all server nodes, restart PBS and re-create the node
        for hostA so vnodes are rebuilt from a fresh inventory query.
        """
        # Remove all nodes
        self.server.manager(MGR_CMD_DELETE, NODE, None, "")
        # Restart PBS
        self.server.restart()
        # Create node
        self.server.manager(MGR_CMD_CREATE, NODE, None, hostA)
        # Wait for 3 seconds for changes to take effect
        time.sleep(3)

    def setUp(self):
        TestFunctional.setUp(self)
        # Speed up the inventory-check hook for the duration of the test.
        self.server.manager(MGR_CMD_SET, PBS_HOOK,
                            {'enabled': 'true', 'freq': 10},
                            id='PBS_alps_inventory_check')
        momA = self.moms.values()[0]
        if not momA.is_cray():
            self.skipTest("%s: not a cray mom."
                          % (momA.shortname))
        mom_config = momA.parse_config()
        if '$alps_client' not in mom_config:
            self.skipTest("alps_client not set in mom config.")
        # One vnode per compute node keeps XML-to-vnode comparison simple.
        if '$vnode_per_numa_node' in mom_config:
            momA.unset_mom_config('$vnode_per_numa_node', False)
        momA.add_config({'$logevent': '0xffffffff'})
        # check if required BASIL version available on the machine.
        for ver in self.basil_version:
            xml_out = self.query_alps(ver, 'QUERY', 'ENGINE')
            xml_tree = ET.parse(xml_out)
            os.remove(xml_out)
            response = xml_tree.find(".//ResponseData")
            status = response.attrib['status']
            if status == "SUCCESS":
                self.available_version = ver
                break
        if self.available_version == "":
            self.skipTest("No supported basil version found on the platform.")
        # Reset nodes
        self.reset_nodes(momA.shortname)

    def query_alps(self, ver, method, qtype):
        """
        Send a query to ALPS of a certain type and return the
        xml output file.

        :param ver: BASIL protocol version, e.g. '1.7'
        :param method: BASIL method, e.g. 'QUERY'
        :param qtype: query type, e.g. 'ENGINE', 'SYSTEM', 'INVENTORY'
        :returns: path to a temp file holding the raw XML response;
                  caller is responsible for removing it.
        """
        basil_protocol = 'protocol="%s"' % (ver)
        basil_method = 'method="%s"' % (method)
        basil_qtype = 'type="%s"' % (qtype)
        # NOTE(review): the Template body below looks truncated -- the
        # original BASIL XML request markup appears to have been lost
        # (likely stripped during text extraction). Verify against the
        # upstream file before relying on this literal.
        queryt = Template('\n')
        query = queryt.substitute(ver=basil_protocol, method=basil_method,
                                  qtype=basil_qtype)
        mom_config = self.mom.parse_config()
        alps_client = mom_config['$alps_client']
        fn = self.du.create_temp_file(body=query)
        xout = self.du.create_temp_file()
        # Feed the request to the alps_client binary, capture stdout as XML.
        self.du.run_cmd(cmd="%s < %s > %s" % (alps_client, fn, xout),
                        as_script=True)
        os.remove(fn)
        return xout

    def comp_node(self, vnode):
        """
        Check if compute node is found in pbsnodes -av output.
        If so check if the vnode attribute has the correct values.

        :param vnode: dict of expected attribute values (from
                      init_inventory_node); empty-string values are skipped.
        """
        name = vnode['vnode']
        try:
            pbs_node = self.server.status(NODE, id=name)[0]
        except PbsStatusError:
            self.assertFalse(pbs_node is None,
                             "Cray compute node %s doesn't exist on pbs server"
                             % (name))
        for rsc, xval in vnode.items():
            # current_aoe is a plain attribute; everything else is a
            # resources_available.* resource.
            if rsc != 'current_aoe':
                resource = 'resources_available.' + rsc
            else:
                resource = rsc
            if xval != "":
                if resource in pbs_node:
                    rval = pbs_node[resource]
                    if rval == xval:
                        self.logger.info(
                            "%s: node has %s=%s" % (name, rsc, rval))
                        self.assertTrue(True)
                    else:
                        # NOTE(review): assertFalse on a non-empty string
                        # always fails, so this acts as self.fail(msg).
                        self.assertFalse("%s: node has %s=%s but XML %s=%s"
                                         % (name, resource, rval, rsc, xval))
                else:
                    self.assertFalse(
                        "%s\t: node has no resource %s" % (name, rsc))

    def get_knl_vnodes(self):
        """
        Query ALPS (BASIL 1.7 SYSTEM) and return a dict mapping nid
        strings to KNL info ({'current_aoe': ..., 'hbmem': ...}) for
        batch/up nodes that report KNL attributes.
        """
        xml_out = self.query_alps('1.7', 'QUERY', 'SYSTEM')
        tree = ET.parse(xml_out)
        os.remove(xml_out)
        root = tree.getroot()
        knl_vnodes = {}
        knl_info = {}
        # If node has the KNL processor then add them
        # to knl_vnodes dictionary
        for node in root.getiterator('Nodes'):
            # XML values
            role = node.attrib["role"]
            state = node.attrib["state"]
            numa_cfg = node.attrib["numa_cfg"]
            hbm_size_mb = node.attrib["hbm_size_mb"]
            hbm_cache_pct = node.attrib["hbm_cache_pct"]
            if role == 'batch' and state == 'up' and numa_cfg != ""\
                    and hbm_size_mb != "" and hbm_cache_pct != "":
                # derived values from XML
                knl_info['current_aoe'] = numa_cfg + '_' + hbm_cache_pct
                knl_info['hbmem'] = hbm_size_mb + 'mb'
                # Element text is a comma-separated list of nids and
                # nid ranges, e.g. "12,20-24".
                nid_ranges = node.text.strip()
                nid_range_list = list(nid_ranges.split(','))
                while len(nid_range_list) > 0:
                    nid_range = nid_range_list.pop()
                    nid1 = nid_range.split('-')
                    if len(nid1) == 2:
                        # range of nodes
                        r1 = int(nid1[0])
                        r2 = int(nid1[1]) + 1
                        for node_id in range(r1, r2):
                            # associate each nid with it's knl information
                            knl_vnodes['%d' % node_id] = knl_info
                    else:
                        # single node
                        node_id = int(nid1[0])
                        knl_vnodes['%d' % node_id] = knl_info
        return knl_vnodes

    def retklist(self):
        """
        Return a list of KNL vnodes, empty list if there are
        no KNL vnodes.
        """
        klist = []
        # Find the list of KNL vnodes (those with current_aoe set)
        kvnl = self.server.filter(VNODE, {'current_aoe': (NE, "")})
        if len(kvnl) == 0:
            self.skipTest(reason='No KNL vnodes present')
        else:
            klist = list(kvnl.values())[0]
            self.logger.info("KNL vnode list: %s" % (klist))
        return klist

    def set_provisioning(self):
        """
        Set provisioning enabled and aoe resource on Xeon Phi nodes.
        """
        # Check for provisioning setup: provisioning cannot be enabled on
        # a node that also hosts the server.
        momA = self.moms.values()[0].shortname
        serverA = self.servers.values()[0].shortname
        msg = ("Provide a mom not present on server host while invoking"
               " the test: -p moms=")
        if momA == serverA:
            self.skipTest(reason=msg)
        nodelist = self.server.status(NODE, 'current_aoe')
        for node in nodelist:
            a = {'provision_enable': 'true',
                 'resources_available.aoe': '%s' % node['current_aoe']}
            self.server.manager(MGR_CMD_SET, NODE, a, id=node['id'])

    def unset_provisioning(self):
        """
        Unset provisioning attribute and aoe resource on Xeon Phi nodes.
        """
        nodelist = self.server.status(NODE, 'current_aoe')
        for node in nodelist:
            a = ['provision_enable', 'resources_available.aoe']
            self.server.manager(MGR_CMD_UNSET, NODE, a, id=node['id'])

    def request_current_aoe(self):
        """
        Get the value of current_aoe set on the XeonPhi vnodes
        (value from the first vnode reporting current_aoe).
        """
        aoe_val = self.server.status(NODE, 'current_aoe')
        req_aoe = aoe_val[0]['current_aoe']
        return req_aoe

    def test_InventoryQueryVersion(self):
        """
        Test if BASIL version is set to required BASIL version
        on cray/simulator platform.
        """
        # HUP mom to force a fresh engine query.
        self.mom.signal('-HUP')
        # NOTE(review): this literal looks truncated -- the original log
        # pattern (likely an XML fragment with angle brackets) appears to
        # have been lost during text extraction. Verify upstream.
        engine_query_log = "" % (self.basil_version[1])
        self.mom.log_match(engine_query_log, n='ALL', max_attempts=3)
        if self.available_version == '1.7':
            msg = 'This Cray system supports the BASIL 1.7 protocol'
            self.mom.log_match(msg, n='ALL', max_attempts=3)
            # Even on a 1.7 system mom reports the basilversion as 1.4.
            basil_version_log = 'alps_engine_query;The basilversion is' \
                ' set to 1.4'
        else:
            basil_version_log = 'alps_engine_query;The basilversion is' \
                ' set to ' + self.available_version
        self.mom.log_match(basil_version_log, max_attempts=3)

    def test_InventoryVnodes(self):
        """
        This test validates the vnode created using alps BASIL 1.4 & 1.7
        inventory query response.
        """
        knl_vnodes = {}
        # Parse inventory query response and fetch node information.
        xml_out = self.query_alps('1.4', 'QUERY', 'INVENTORY')
        xml_tree = ET.parse(xml_out)
        os.remove(xml_out)
        inventory_1_4_el = xml_tree.find(".//Inventory")
        hn = inventory_1_4_el.attrib["mpp_host"]
        if self.available_version == '1.7':
            knl_vnodes = self.get_knl_vnodes()
        # Fill vnode structure using BASIL response
        for node in inventory_1_4_el.getiterator('Node'):
            role = node.attrib["role"]
            if role == 'BATCH':
                # XML values
                node_id = node.attrib["node_id"]
                cu_el = node.findall('.//ComputeUnit')
                mem_el = node.findall('.//Memory')
                ac_el = node.findall('.//Accelerator')
                page_size_kb = mem_el[0].attrib["page_size_kb"]
                page_count = mem_el[0].attrib["page_count"]
                vnode = self.init_inventory_node()
                vnode['arch'] = node.attrib['architecture']
                vnode['vnode'] = hn + '_' + node_id
                vnode['vntype'] = "cray_compute"
                # Total memory = page size * page count * memory elements.
                vnode['mem'] = str(int(page_size_kb) *
                                   int(page_count) * len(mem_el)) + "kb"
                vnode['host'] = vnode['vnode']
                vnode['PBScraynid'] = node_id
                vnode['PBScrayhost'] = hn
                vnode['ncpus'] = str(len(cu_el))
                if ac_el:
                    vnode['naccelerators'] = str(len(ac_el))
                    vnode['accelerator_memory'] = str(
                        ac_el[0].attrib['memory_mb']) + "mb"
                    vnode['accelerator_model'] = ac_el[0].attrib['family']
                # Overlay KNL-specific attributes when the nid is KNL.
                if node_id in knl_vnodes:
                    vnode['hbmem'] = knl_vnodes[node_id]['hbmem']
                    vnode['current_aoe'] = knl_vnodes[node_id]['current_aoe']
                    vnode['vnode'] = hn + '_' + node_id
                # Compare xml vnode with pbs node.
                self.logger.info("Validating vnode:%s" % (vnode['vnode']))
                self.comp_node(vnode)

    def test_cray_login_node(self):
        """
        This test validates that cray mom node resources value remain
        unchanged before and after adding $alps_client in mom config.
        """
        mom_id = self.mom.shortname
        try:
            # Snapshot node attributes, drop $alps_client, rebuild nodes,
            # then snapshot again for comparison.
            cray_login_node = self.server.status(NODE, id=mom_id)[0]
            self.mom.unset_mom_config('$alps_client', False)
            self.reset_nodes(mom_id)
            pbs_node = self.server.status(NODE, id=mom_id)[0]
        except PbsStatusError:
            self.assertFalse(True, "Mom node %s doesn't exist on pbs server"
                             % (mom_id))
        # List of resources to be ignored while comparing.
        ignr_rsc = ['license', 'last_state_change_time']
        for rsc, val in pbs_node.items():
            if rsc in ignr_rsc:
                continue
            self.assertTrue(rsc in cray_login_node,
                            ("%s\t: login node has no rsc %s")
                            % (mom_id, rsc))
            rval = cray_login_node[rsc]
            self.assertEqual(rval, val,
                             ("%s\t: pbs node has %s=%s but login "
                              "node has %s=%s")
                             % (mom_id, rsc, val, rsc, rval))

    def test_hbmemm_rsc(self):
        """
        Create a job that requests enough HBMEM.
        Submit the job to the Server.
        Check if the job is in the 'R' state and if the job runs on a
        KNL vnode.
        Delete the job.
        """
        knl_vnodes = self.get_knl_vnodes()
        if len(knl_vnodes) == 0:
            self.skipTest(reason='No KNL vnodes present')
        else:
            self.logger.info("KNL vnode list: %s" % (knl_vnodes))
        hbm_req = 4192
        a = {'Resource_List.select': '1:hbmem=%dmb' % hbm_req}
        job = Job(TEST_USER, attrs=a)
        job_id = self.server.submit(job)
        self.server.expect(JOB, {'job_state': 'R'}, id=job_id)
        # Check that exec_vnode is a KNL vnode.
        self.server.status(JOB, 'exec_vnode', id=job_id)
        evnode = list(job.execvnode()[0].keys())[0]
        # vnode names are "<host>_<nid>"; extract the nid part.
        nid = evnode.split('_')[1]
        if nid in knl_vnodes.keys():
            self.logger.info("exec_vnode %s is a KNL vnode." % (evnode))
            rv = 1
        else:
            self.logger.info("exec_vnode %s is not a KNL vnode." % (evnode))
            rv = 0
        self.assertTrue(rv == 1)
        nodes = self.server.status(NODE)
        for n in nodes:
            v_name = n['id']
            if v_name == evnode:
                hbm_assig = n['resources_assigned.hbmem']
                hbm_int = int(re.search(r'\d+', hbm_assig).group())
                # Requested mb vs. assigned value reported in kb.
                hbm_in_kb = hbm_req * 1024
                self.logger.info(
                    "vnode name=%s -- hbm assigned=%s -- hbm requested=%dkb"
                    % (v_name, hbm_assig, hbm_in_kb))
                if hbm_int == hbm_in_kb:
                    self.logger.info(
                        "The requested hbmem of %s mb has been assigned."
                        % (str(hbm_req)))
                    self.assertTrue(True)
                else:
                    self.logger.info(
                        "The assigned hbmem of %s, on %s, does not match "
                        "requested hbmem of %d mb"
                        % (hbm_assig, v_name, hbm_req))
                    self.assertTrue(False)

    def test_job_request_insufficent_hbmemm_rsc(self):
        """
        Submit a job request that requests more than available HBMEM.
        Check if the job is in the 'Q' state with valid comment.
        Delete the job
        """
        # Find the list of KNL vnodes
        knl_vnodes = self.get_knl_vnodes()
        if len(knl_vnodes) == 0:
            self.skipTest(reason='No KNL vnodes present')
        else:
            self.logger.info("KNL vnode list: %s" % (knl_vnodes))
        # 18000mb exceeds the HBMEM any single KNL node can offer.
        hbm_req = 18000
        a = {'Resource_List.select': '1:hbmem=%dmb' % hbm_req}
        job = Job(TEST_USER, attrs=a)
        job_id = self.server.submit(job)
        # Check that job is in Q state with valid comment
        job_comment = "Not Running: Insufficient amount of resource: hbmem"
        self.server.expect(JOB, {'job_state': 'Q',
                                 'comment': (MATCH_RE, job_comment)},
                           attrop=PTL_AND, id=job_id)

    def test_job_request_knl(self):
        """
        Create a job that requests aoe should run on a KNL vnode.
        Submit the job to the Server.
        Check if the job runs on a KNL vnode and if the job is in
        the 'R' state.
        """
        if self.du.platform == 'craysim':
            self.skipTest(reason='Test is not applicable for Craysim')
        # Find the list of KNL vnodes
        klist = self.retklist()
        # Set provisioning attributes on KNL vnode.
        self.set_provisioning()
        # Submit job that request aoe
        req_aoe = self.request_current_aoe()
        job = Job(TEST_USER)
        job.create_script(
            "#PBS -joe -o localhost:/tmp -lselect=1:ncpus=1:aoe=%s\n"
            % req_aoe +
            " cd /tmp\n"
            "aprun -B sleep 10\n"
            "sleep 10")
        job_id = self.server.submit(job)
        self.server.expect(JOB, {'job_state': 'R'}, id=job_id)
        # Check that exec_vnode is a KNL vnode.
        self.server.status(JOB, 'exec_vnode', id=job_id)
        evnode = job.get_vnodes()[0]
        self.assertIn(evnode, klist,
                      "exec_vnode %s is not a KNL vnode." % (evnode))
        self.logger.info("exec_vnode %s is a KNL vnode." % (evnode))
        # Unset provisioning attributes.
        self.unset_provisioning()

    def test_job_request_subchunk(self):
        """
        Test job request consist of subchunks with and without
        aoe resource.
        """
        if self.du.platform == 'craysim':
            self.skipTest(reason='Test is not applicable for craysim')
        # Find the list of KNL vnodes
        klist = self.retklist()
        # Set provisioning attributes.
        self.set_provisioning()
        # Submit job that request sub-chunk with and without aoe resources
        req_aoe = self.request_current_aoe()
        job = Job(TEST_USER)
        job.create_script(
            "#PBS -joe -o localhost:/tmp -lplace=scatter "
            "-lselect=1:ncpus=1:aoe=%s+1:ncpus=1\n" % req_aoe +
            " cd /tmp\n"
            "aprun -B sleep 10\n"
            "sleep 10")
        job_id = self.server.submit(job)
        self.server.expect(JOB, {'job_state': 'R'}, id=job_id)
        # First chunk must land on a KNL vnode, second on a non-KNL one.
        self.server.status(JOB, 'exec_vnode', id=job_id)
        evnode = job.get_vnodes()
        self.assertIn(evnode[0], klist,
                      "exec_vnode %s is not a KNL vnode." % (evnode[0]))
        self.logger.info("exec_vnode %s is a KNL vnode." % (evnode[0]))
        self.assertNotIn(evnode[1], klist, "exec_vnode %s is a KNL"
                         " vnode." % (evnode[1]))
        self.logger.info("exec_vnode %s is not a KNL vnode." % (evnode[1]))
        # Unset provisioning attributes.
        self.unset_provisioning()

    def test_pbs_alps_in_sync(self):
        """
        Check for the presence of message indicating
        PBS and ALPS are in sync.
        """
        # Determine if BASIL 1.7 is supported.
        try:
            rv = self.mom.log_match(
                "This Cray system supports the BASIL 1.7 protocol.",
                n='ALL', max_attempts=10)
        except PtlLogMatchError:
            self.skipTest(
                reason='Test not applicable for system not having BASIL 1.7')
        # Determine if KNL vnodes are present.
        knl_vnodes = self.get_knl_vnodes()
        if len(knl_vnodes) == 0:
            self.skipTest(reason='No KNL vnodes present')
        else:
            self.logger.info("KNL vnode list: %s" % (knl_vnodes))
        # Check for PBS ALPS Inventory Hook message.
        now = time.time()
        rv = self.mom.log_match("ALPS Inventory Check: PBS and ALPS"
                                " are in sync", starttime=now, interval=5)
        self.assertTrue(rv)

    def test_knl_batch_to_interactive(self):
        """
        Change the mode of any two KNL nodes to interactive.
        Then check if the PBS_alps_inventory_check hook picks up on
        the change and nodes are marked as stale.
        Restore changes to hook and mode of KNL nodes.
        """
        if self.du.platform == 'craysim':
            self.skipTest(reason='xtprocadmin cmd is not on cray simulator')
        # Find the list of KNL vnodes
        klist = self.retklist()
        # Change mode of two KNL nodes (first and last) to interactive
        if len(klist) >= 2:
            k1 = klist[0]
            k2 = klist[len(klist) - 1]
            # nid is the numeric part of the vnode name.
            knl1 = re.search(r'\d+', k1).group()
            knl2 = re.search(r'\d+', k2).group()
            cmd = ['xtprocadmin', '-k', 'm', 'interactive', '-n', knl1]
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            cmd = ['xtprocadmin', '-k', 'm', 'interactive', '-n', knl2]
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            # Do Mom HUP
            self.mom.signal('-HUP')
            # Check that the nodes are now stale.
            self.server.expect(VNODE, {'state': 'Stale'}, id=k1,
                               max_attempts=10, interval=5)
            self.server.expect(VNODE, {'state': 'Stale'}, id=k2)
            # Change nodes back to batch mode
            cmd = ['xtprocadmin', '-k', 'm', 'batch']
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            # Do Mom HUP
            self.mom.signal('-HUP')
            # Check that the nodes are now free.
            self.server.expect(VNODE, {'state': 'free'}, id=k1,
                               max_attempts=10, interval=5)
            self.server.expect(VNODE, {'state': 'free'}, id=k2)

    def test_job_run_on_knl_node(self):
        """
        Change the mode of KNL nodes to batch.
        Then check if the PBS_alps_inventory_check hook picks up on
        the change.
        Submit job and confirm job should be in R state
        """
        if self.du.platform == 'craysim':
            self.skipTest(reason='xtprocadmin cmd is not on cray simulator')
        # Find the list of KNL vnodes
        klist = self.retklist()
        # Change mode of all nodes to interactive
        cmd = ['xtprocadmin', '-k', 'm', 'interactive']
        ret = self.server.du.run_cmd(self.server.hostname, cmd, logerr=True)
        self.assertEqual(ret['rc'], 0)
        # Change mode of two KNL nodes back to batch; only those two can
        # then run batch work.
        if len(klist) >= 2:
            k1 = klist[0]
            k2 = klist[len(klist) - 1]
            knl1 = re.search(r'\d+', k1).group()
            knl2 = re.search(r'\d+', k2).group()
            cmd = ['xtprocadmin', '-k', 'm', 'batch', '-n', knl1]
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            cmd = ['xtprocadmin', '-k', 'm', 'batch', '-n', knl2]
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            # Do Mom HUP
            self.mom.signal('-HUP')
            # Check that the nodes are Free.
            self.server.expect(VNODE, {'state': 'free'}, id=k1,
                               max_attempts=10, interval=5)
            self.server.expect(VNODE, {'state': 'free'}, id=k2)
            # Submit few jobs
            a = {'Resource_List.select': '1:vntype=cray_compute'}
            job = Job(TEST_USER, attrs=a)
            job_id = self.server.submit(job)
            self.server.expect(JOB, {'job_state': 'R'}, id=job_id)
            # Check that exec_vnode is a KNL vnode.
            self.server.status(JOB, 'exec_vnode', id=job_id)
            evnode = job.get_vnodes()[0]
            self.assertIn(evnode, klist,
                          "exec_vnode %s is not a KNL vnode." % (evnode))
            self.logger.info("exec_vnode %s is a KNL vnode." % (evnode))
            job2 = Job(TEST_USER, attrs=a)
            job_id2 = self.server.submit(job2)
            self.server.expect(JOB, {'job_state': 'R'}, id=job_id2)
            # Check that exec_vnode is a KNL vnode.
            self.server.status(JOB, 'exec_vnode', id=job_id2)
            evnode = job2.get_vnodes()[0]
            self.assertIn(evnode, klist,
                          "exec_vnode %s is not a KNL vnode." % (evnode))
            self.logger.info("exec_vnode %s is a KNL vnode." % (evnode))
            # Third job must queue: both batch-mode KNL nodes are busy.
            job3 = Job(TEST_USER, attrs=a)
            job_id3 = self.server.submit(job3)
            self.server.expect(JOB, {'job_state': 'Q'}, id=job_id3)
            # Delete the Job1.
            self.server.delete(job_id, wait=True)
            # Verify Job3 should start running
            self.server.expect(JOB, {'job_state': 'R'}, id=job_id3)
            # Check that exec_vnode is a KNL vnode.
            self.server.status(JOB, 'exec_vnode', id=job_id3)
            evnode = job3.get_vnodes()[0]
            self.assertIn(evnode, klist,
                          "exec_vnode %s is not a KNL vnode." % (evnode))
            self.logger.info("exec_vnode %s is a KNL vnode." % (evnode))

    def test_validate_pbs_xeon_phi_provision_hook(self):
        """
        Verify the default attribute of pbs_hook PBS_xeon_phi_provision
        hook.
        """
        if self.du.platform != 'cray':
            self.skipTest(reason='pbs_hook PBS_xeon_phi_provision is not'
                          ' available on non-cray machine')
        # Expected factory defaults of the hook.
        attr = {'type': 'pbs', 'enabled': 'false', 'event': 'provision',
                'alarm': 1800, 'order': 1, 'debug': 'false',
                'user': 'pbsadmin', 'fail_action': 'none'}
        self.server.manager(MGR_CMD_LIST, PBS_HOOK, attr,
                            id='PBS_xeon_phi_provision')
        # Modify, verify the modification took effect...
        self.server.manager(MGR_CMD_SET, PBS_HOOK,
                            {'enabled': 'true', 'alarm': 1000},
                            id='PBS_xeon_phi_provision')
        self.server.manager(MGR_CMD_LIST, PBS_HOOK,
                            {'enabled': 'true', 'alarm': 1000},
                            id='PBS_xeon_phi_provision')
        # Reset pbs_hook value to default PBS_xeon_phi_provision hook
        self.server.manager(MGR_CMD_SET, PBS_HOOK,
                            {'enabled': 'false', 'alarm': 1800},
                            id='PBS_xeon_phi_provision')
        self.server.manager(MGR_CMD_LIST, PBS_HOOK, attr,
                            id='PBS_xeon_phi_provision')

    def tearDown(self):
        """
        Undo test-wide changes: restore batch mode on all nodes,
        restore the inventory-check hook frequency, and HUP mom.
        """
        TestFunctional.tearDown(self)
        if self.du.platform == 'cray':
            # Change all nodes back to batch mode and restart PBS
            cmd = ['xtprocadmin', '-k', 'm', 'batch']
            self.logger.info(cmd)
            ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                         logerr=True)
            self.assertEqual(ret['rc'], 0)
            # Restore hook freq to 300
            self.server.manager(MGR_CMD_SET, PBS_HOOK,
                                {'enabled': 'true', 'freq': 300},
                                id='PBS_alps_inventory_check')
            # Do Mom HUP
            self.mom.signal('-HUP')
================================================ FILE: test/tests/functional/pbs_calendaring.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
import time

from tests.functional import *
from ptl.utils.pbs_logutils import PBSLogUtils


class TestCalendaring(TestFunctional):
    """
    This test suite tests if PBS scheduler calendars events correctly
    """

    def test_topjob_start_time(self):
        """
        In this test we test that the top job which gets added to the
        calendar has estimated start time correctly set for future when
        job history is enabled and opt_backfill_fuzzy is turned off.
        """
        # Strict ordering forces the scheduler to calendar (backfill
        # around) jobs it cannot run immediately.
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        # Single-cpu node so the second array subjob and the normal job
        # must wait behind the running subjob.
        a = {'resources_available.ncpus': 1}
        self.server.manager(MGR_CMD_SET, NODE, a, self.mom.shortname)
        a = {'backfill_depth': '2', 'job_history_enable': 'True'}
        self.server.manager(MGR_CMD_SET, SERVER, a)

        # Turn opt_backfill_fuzzy off because we want to check if the job can
        # run after performing every end event in calendaring code instead
        # of rounding it off to next time boundary (default is 60 seconds)
        a = {'opt_backfill_fuzzy': 'off'}
        self.server.manager(MGR_CMD_SET, SCHED, a)

        # Array job: 6 subjobs, each needing the node's only cpu for 30s.
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 30,
                   'array_indices_submitted': '1-6'}
        j1 = Job(TEST_USER, attrs=res_req)
        j1.set_sleep_time(30)
        jid1 = self.server.submit(j1)
        j1_sub1 = j1.create_subjob_id(jid1, 1)
        j1_sub2 = j1.create_subjob_id(jid1, 2)
        # A normal job that must queue behind the array subjobs.
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 30}
        j2 = Job(TEST_USER, attrs=res_req)
        jid2 = self.server.submit(j2)
        # Subjob 1 finishes (X with history enabled), subjob 2 runs,
        # and the normal job waits.
        self.server.expect(JOB, {'job_state': 'X'}, j1_sub1, interval=1)
        self.server.expect(JOB, {'job_state': 'R'}, j1_sub2)
        self.server.expect(JOB, {'job_state': 'Q'}, jid2)
        job1 = self.server.status(JOB, id=jid1)
        job2 = self.server.status(JOB, id=jid2)
        time_now = int(time.time())

        # get estimated start time of both the jobs
        self.assertIn('estimated.start_time', job1[0])
        est_val1 = job1[0]['estimated.start_time']
        self.assertIn('estimated.start_time', job2[0])
        est_val2 = job2[0]['estimated.start_time']
        est1 = time.strptime(est_val1, "%a %b %d %H:%M:%S %Y")
        est2 = time.strptime(est_val2, "%a %b %d %H:%M:%S %Y")
        est_epoch1 = int(time.mktime(est1))
        est_epoch2 = int(time.mktime(est2))

        # since only one subjob of array parent can become topjob
        # second job must start 30 seconds after that because
        # walltime of array job is 30 seconds.
        self.assertEqual(est_epoch2, est_epoch1 + 30)
        # Also make sure that since second subjob from array is running
        # Third subjob should set estimated.start_time in future.
        self.assertGreater(est_epoch1, time_now)

    def test_topjob_start_time_of_subjob(self):
        """
        In this test we test that the subjob which gets added to the
        calendar as top job and it has estimated start time correctly set
        when opt_backfill_fuzzy is turned off.
        """
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        a = {'resources_available.ncpus': 1}
        self.server.manager(MGR_CMD_SET, NODE, a, self.mom.shortname)
        a = {'backfill_depth': '2'}
        self.server.manager(MGR_CMD_SET, SERVER, a)

        # Turn opt_backfill_fuzzy off because we want to check if the job can
        # run after performing every end event in calendaring code instead
        # of rounding it off to next time boundary (default is 60 seconds)
        a = {'opt_backfill_fuzzy': 'off'}
        self.server.manager(MGR_CMD_SET, SCHED, a)

        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 20,
                   'array_indices_submitted': '1-6'}
        j = Job(TEST_USER, attrs=res_req)
        j.set_sleep_time(10)
        jid = self.server.submit(j)
        j1_sub1 = j.create_subjob_id(jid, 1)
        j1_sub2 = j.create_subjob_id(jid, 2)
        self.server.expect(JOB, {'job_state': 'X'}, j1_sub1, interval=1)
        self.server.expect(JOB, {'job_state': 'R'}, j1_sub2)
        job_arr = self.server.status(JOB, id=jid)
        # check estimated start time is set on job array
        self.assertIn('estimated.start_time', job_arr[0])
        # The scheduler must not have logged a start-time calculation
        # failure for the calendared subjob.
        errmsg = jid + ";Error in calculation of start time of top job"
        self.scheduler.log_match(errmsg, existence=False, max_attempts=10)

    def test_topjob_fail(self):
        """
        Test that when we fail to add a job to the calendar it doesn't take
        up a topjob slot.
        The server's backfill_depth is 1 by default, so we just need to
        submit a job that can never run and a job that can.  The can never
        run job will fail to be added to the calendar and the second job
        will be.
        """
        # We need two nodes to create the situation where a job can never run.
        # We need to create this situation in such a way that the scheduler
        # doesn't detect it.  If the scheduler detects that a job can't run,
        # it won't try and add it to the calendar.  To do this, we ask for
        # 1 node with 2 cpus.  There are 2 nodes with 1 cpu each.
        attrs = {'resources_available.ncpus': 1}
        self.mom.create_vnodes(attrib=attrs, num=2, sharednode=False)
        self.scheduler.set_sched_config({'strict_ordering': 'True ALL'})

        # Submit job to eat up all the resources
        attrs = {'Resource_List.select': '2:ncpus=1',
                 'Resource_List.walltime': '1:00:00'}
        j1 = Job(TEST_USER, attrs)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)

        # Hold scheduling so both waiting jobs are considered in the
        # same scheduling cycle.
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})

        # submit job that can never run.
        attrs['Resource_List.select'] = '1:ncpus=2'
        j2 = Job(TEST_USER, attrs)
        jid2 = self.server.submit(j2)

        # submit a job that can run, but just not now
        attrs['Resource_List.select'] = '1:ncpus=1'
        j3 = Job(TEST_USER, attrs)
        jid3 = self.server.submit(j3)

        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'True'})

        # jid2 fails calendaring; jid3 takes the (single) topjob slot.
        msg = jid2 + ';Error in calculation of start time of top job'
        self.scheduler.log_match(msg)
        msg = jid3 + ';Job is a top job and will run at'
        self.scheduler.log_match(msg)

    def test_topjob_bucket(self):
        """
        In this test we test that a bucket job will be calendared to start
        at the end of the last job on a node
        """
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        a = {'resources_available.ncpus': 2}
        self.mom.create_vnodes(a, 1)
        # Two running jobs: 30s and 45s walltimes fill both cpus.
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 30}
        j1 = Job(TEST_USER, attrs=res_req)
        j1.set_sleep_time(30)
        jid1 = self.server.submit(j1)
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 45}
        j2 = Job(TEST_USER, attrs=res_req)
        j2.set_sleep_time(45)
        jid2 = self.server.submit(j2)
        # place=excl makes j3 a bucket job; it needs the whole node, so
        # it must wait for the longer-running job (j2) to finish.
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.place': 'excl'}
        j3 = Job(TEST_USER, attrs=res_req)
        jid3 = self.server.submit(j3)
        self.server.expect(JOB, {'job_state': 'R'}, jid1)
        self.server.expect(JOB, {'job_state': 'R'}, jid2)
        self.server.expect(JOB, {'job_state': 'Q'}, jid3)
        job1 = self.server.status(JOB, id=jid1)
        job2 = self.server.status(JOB, id=jid2)
        job3 = self.server.status(JOB, id=jid3)
        # j3's estimate must match j2's start time + its 45s walltime
        # (within 1s of clock skew).
        end_time = time.mktime(time.strptime(job2[0]['stime'], '%c')) + 45
        est_time = job3[0]['estimated.start_time']
        est_time = time.mktime(time.strptime(est_time, '%c'))
        self.assertAlmostEqual(end_time, est_time, delta=1)

    def test_zero_resource_pushes_topjob(self):
        """
        This test case tests the scenario where a job that requests zero
        instance of a resource as the last resource in the select statement
        pushes the start time of top jobs
        """
        attrs = {'resources_available.ncpus': 4}
        self.mom.create_vnodes(attrib=attrs, num=5, sharednode=False)
        # Host-level consumable resource; requesting ngpus=0 is the
        # trigger condition under test.
        attr = {ATTR_RESC_TYPE: 'long', ATTR_RESC_FLAG: 'hn'}
        self.server.manager(MGR_CMD_CREATE, RSC, attr, id='ngpus')
        # Append ngpus (and a dummy 'zz') to the scheduler's resources
        # line, keeping the existing entries and the closing quote.
        resources = self.scheduler.sched_config['resources']
        resources = resources[:-1] + ', ngpus, zz\"'
        a = {'job_sort_key': '"job_priority HIGH ALL"',
             'resources': resources,
             'strict_ordering': 'True ALL'}
        self.scheduler.set_sched_config(a)
        # Two jobs consume 2 vnodes each, leaving one vnode free.
        a = {'Resource_List.select': '2:ncpus=4',
             'Resource_List.walltime': '1:00:00',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid1 = self.server.submit(j)
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid2 = self.server.submit(j)
        # High-priority whole-cluster job becomes the top job.
        a = {'Resource_List.select': '5:ncpus=4',
             'Resource_List.walltime': '1:00:00',
             ATTR_p: "1000",
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid3 = self.server.submit(j)
        # jid4 (no ngpus request) and jid5 (ngpus=0) are identical in
        # effect; both would outlast the top job's start and must be
        # held back the same way.
        a = {'Resource_List.select': '1:ncpus=4',
             'Resource_List.walltime': '24:00:01',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid4 = self.server.submit(j)
        a = {'Resource_List.select': '1:ncpus=4:ngpus=0',
             'Resource_List.walltime': '24:00:01',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid5 = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2)
        self.server.expect(JOB, {ATTR_state: 'Q'}, id=jid3)
        c = "Not Running: Job would conflict with reservation or top job"
        self.server.expect(JOB, {ATTR_state: 'Q', ATTR_comment: c}, id=jid4)
        self.server.expect(JOB, {ATTR_state: 'Q', ATTR_comment: c}, id=jid5)

    def test_zero_resource_job_conflict_resv(self):
        """
        This test case tests the scenario where a job that requests zero
        instance of a resource as the last resource in the select statement
        pushes the start time of reservations
        """
        attrs = {'resources_available.ncpus': 4}
        self.mom.create_vnodes(attrib=attrs, num=5, sharednode=False)
        attr = {ATTR_RESC_TYPE: 'long', ATTR_RESC_FLAG: 'hn'}
        self.server.manager(MGR_CMD_CREATE, RSC, attr, id='ngpus')
        # Append ngpus (and a dummy 'zz') to the scheduler's resources
        # line, keeping the existing entries and the closing quote.
        resources = self.scheduler.sched_config['resources']
        resources = resources[:-1] + ', ngpus, zz\"'
        a = {'job_sort_key': '"job_priority HIGH ALL"',
             'resources': resources,
             'strict_ordering': 'True ALL'}
        self.scheduler.set_sched_config(a)
        a = {'Resource_List.select': '2:ncpus=4',
             'Resource_List.walltime': '1:00:00',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid1 = self.server.submit(j)
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid2 = self.server.submit(j)
        # Whole-cluster reservation starting just after the running
        # jobs' walltimes end.
        now = int(time.time())
        a = {'Resource_List.select': '5:ncpus=4',
             'reserve_start': now + 3610,
             'reserve_end': now + 6610,
             'Resource_List.place': 'vscatter'}
        r = Reservation(TEST_USER)
        r.set_attributes(a)
        rid = self.server.submit(r)
        exp = {'reserve_state': (MATCH_RE, "RESV_CONFIRMED|2")}
        self.server.expect(RESV, exp, id=rid)
        # jid3 (no ngpus) and jid4 (ngpus=0) both run past the
        # reservation start and must both be held back the same way.
        a = {'Resource_List.select': '1:ncpus=4',
             'Resource_List.walltime': '24:00:01',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid3 = self.server.submit(j)
        a = {'Resource_List.select': '1:ncpus=4:ngpus=0',
             'Resource_List.walltime': '24:00:01',
             'Resource_List.place': 'vscatter'}
        j = Job(TEST_USER)
        j.set_attributes(a)
        jid4 = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2)
        c = "Not Running: Job would conflict with reservation or top job"
        self.server.expect(JOB, {ATTR_state: 'Q', ATTR_comment: c}, id=jid3)
        self.server.expect(JOB, {ATTR_state: 'Q', ATTR_comment: c}, id=jid4)

    def test_topjob_stale_estimates_clearing_on_clear_attr_set(self):
        """
        In this test we test that former top job with stale estimate gets
        the estimate cleared once the server attribute
        clear_topjob_estimates_enable is set to True
        """
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        a = {'resources_available.ncpus': 1}
        self.server.manager(MGR_CMD_SET, NODE, a, self.mom.shortname)
        a = {'backfill_depth': '2'}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        # Frequent cycles so the topjob status change is picked up fast.
        a = {'scheduler_iteration': '5'}
        self.server.manager(MGR_CMD_SET, SCHED, a)
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 300}
        j1 = Job(TEST_USER, attrs=res_req)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, jid1)
        j2 = Job(TEST_USER, attrs=res_req)
        jid2 = self.server.submit(j2)
        # j2 waits behind j1 and gets calendared with estimates.
        job2 = self.server.status(JOB, id=jid2)
        self.assertIn('estimated.start_time', job2[0])
        self.assertIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': True}, jid2, max_attempts=5)
        # Disabling backfill removes j2's topjob status; without the
        # clear attribute set, the stale estimates remain.
        a = {'backfill_depth': '0'}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        time.sleep(6)
        job2 = self.server.status(JOB, id=jid2)
        self.assertIn('estimated.start_time', job2[0])
        self.assertIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': False}, jid2, max_attempts=5)
        # Turning the attribute on now clears the stale estimates.
        a = {'clear_topjob_estimates_enable': True}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        self.server.expect(JOB, 'estimated.start_time', id=jid2, op=UNSET,
                           interval=1, max_attempts=10)
        self.server.expect(JOB, 'estimated.exec_vnode', id=jid2, op=UNSET,
                           interval=1, max_attempts=10)

    def test_topjob_estimates_clearing_enabled(self):
        """
        In this test we test that the top job which gets added to the
        calendar with valid estimate has estimate cleared once it loses
        top job status. The clearing needs to have the server attribute
        clear_topjob_estimates_enable set to true. Also, the job's topjob
        attribute is set accordingly.
        """
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        a = {'resources_available.ncpus': 1}
        self.server.manager(MGR_CMD_SET, NODE, a, self.mom.shortname)
        # Clearing enabled from the start, unlike the stale-estimate test.
        a = {'backfill_depth': '2', 'clear_topjob_estimates_enable': True}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        a = {'scheduler_iteration': '5'}
        self.server.manager(MGR_CMD_SET, SCHED, a)
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 300}
        j1 = Job(TEST_USER, attrs=res_req)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, jid1)
        j2 = Job(TEST_USER, attrs=res_req)
        jid2 = self.server.submit(j2)
        job2 = self.server.status(JOB, id=jid2)
        self.assertIn('estimated.start_time', job2[0])
        self.assertIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': True}, jid2, max_attempts=5)
        # Losing topjob status must clear the estimates immediately.
        a = {'backfill_depth': '0'}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        time.sleep(6)
        job2 = self.server.status(JOB, id=jid2)
        self.assertNotIn('estimated.start_time', job2[0])
        self.assertNotIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': False}, jid2, max_attempts=5)

    def test_topjob_estimates_clearing_disabled(self):
        """
        In this test we test that the top job which gets added to the
        calendar with valid estimate has not estimate cleared if it loses
        top job status. The clearing is prevented by
        clear_topjob_estimates_enable set to false/unset. Also, the job's
        topjob attribute is set accordingly.
        """
        self.scheduler.set_sched_config({'strict_ordering': 'true all'})
        a = {'resources_available.ncpus': 1}
        self.server.manager(MGR_CMD_SET, NODE, a, self.mom.shortname)
        # Clearing explicitly disabled: estimates must survive the loss
        # of topjob status.
        a = {'backfill_depth': '2', 'clear_topjob_estimates_enable': False}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        a = {'scheduler_iteration': '5'}
        self.server.manager(MGR_CMD_SET, SCHED, a)
        res_req = {'Resource_List.select': '1:ncpus=1',
                   'Resource_List.walltime': 300}
        j1 = Job(TEST_USER, attrs=res_req)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, jid1)
        j2 = Job(TEST_USER, attrs=res_req)
        jid2 = self.server.submit(j2)
        job2 = self.server.status(JOB, id=jid2)
        self.assertIn('estimated.start_time', job2[0])
        self.assertIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': True}, jid2, max_attempts=5)
        a = {'backfill_depth': '0'}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        time.sleep(6)
        job2 = self.server.status(JOB, id=jid2)
        self.assertIn('estimated.start_time', job2[0])
        self.assertIn('estimated.exec_vnode', job2[0])
        self.server.expect(JOB, {'topjob': False}, jid2, max_attempts=5)


================================================
FILE: test/tests/functional/pbs_cgroups_hook.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE.
See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. import glob from tests.functional import * # # FUNCTION convert_size # def convert_size(value, units='b'): """ Convert a string containing a size specification (e.g. "1m") to a string using different units (e.g. "1024k"). This function only interprets a decimal number at the start of the string, stopping at any unrecognized character and ignoring the rest of the string. When down-converting (e.g. MB to KB), all calculations involve integers and the result returned is exact. When up-converting (e.g. KB to MB) floating point numbers are involved. The result is rounded up. For example: 1023MB -> GB yields 1g 1024MB -> GB yields 1g 1025MB -> GB yields 2g <-- This value was rounded up Pattern matching or conversion may result in exceptions. 
""" logs = {'b': 0, 'k': 10, 'm': 20, 'g': 30, 't': 40, 'p': 50, 'e': 60, 'z': 70, 'y': 80} try: new = units[0].lower() if new not in logs: raise ValueError('Invalid unit value') result = re.match(r'([-+]?\d+)([bkmgtpezy]?)', str(value).lower()) if not result: raise ValueError('Unrecognized value') val, old = result.groups() if int(val) < 0: raise ValueError('Value may not be negative') if old not in logs: old = 'b' factor = logs[old] - logs[new] val = float(val) val *= 2 ** factor if (val - int(val)) > 0.0: val += 1.0 val = int(val) return str(val) + units.lower() except Exception: return None def have_swap(): """ Returns 1 if swap space is not 0 otherwise returns 0 """ tt = 0 with open(os.path.join(os.sep, 'proc', 'meminfo'), 'r') as fd: for line in fd: entry = line.split() if ((entry[0] == 'SwapFree:') and (entry[1] != '0')): tt = 1 return tt def systemd_escape(buf): """ Escape strings for usage in system unit names Some distros don't provide the systemd-escape command """ if not isinstance(buf, str): raise ValueError('Not a basetype string') ret = '' for i, char in enumerate(buf): if i < 1 and char == '.': if (sys.version_info[0] < 3): ret += '\\x' + '.'.encode('hex') else: ret += '\\x' + b'.'.hex() elif char.isalnum() or char in '_.': ret += char elif char == '/': ret += '-' else: # Will turn non-ASCII into UTF-8 hex sequence on both Py2/3 if (sys.version_info[0] < 3): hexval = char.encode('hex') else: hexval = char.encode('utf-8').hex() for j in range(0, len(hexval), 2): ret += '\\x' + hexval[j:j + 2] return ret def count_items(items): """ Given a comma-separated string of numerical items of either singular value or a range of values (-), return the actual number of items. 
For example, items="4-6,9,12-15" count(items) = 8 since items expands to "4,5,6,9,12,13,14,15" """ ct = 0 if items is None: return ct for i in items.split(','): j = i.split('-') if len(j) == 2: ct += len(range(int(j[0]), int(j[1]))) + 1 else: ct += 1 return ct @tags('mom', 'multi_node') class TestCgroupsHook(TestFunctional): """ This test suite targets Linux Cgroups hook functionality. """ def is_memsw_enabled(self, host, mem_path): """ Check if system has swapcontrol enabled, then return true else return false """ if not mem_path: self.logger.info("memory controller not enabled on this host") return 'false' # List all files and check if memsw files exists if self.du.isfile(hostname=host, path=mem_path + os.path.sep + "memory.memsw.usage_in_bytes"): self.logger.info("memsw swap accounting is enabled on this host") return 'true' else: self.logger.info("memsw swap accounting not enabled on this host") return 'false' def setUp(self): self.hook_name = 'pbs_cgroups' # Cleanup previous pbs_cgroup hook so as to not interfere with test c_hook = self.server.filter(HOOK, {'enabled': True}, id=self.hook_name) if c_hook: self.server.manager(MGR_CMD_DELETE, HOOK, id=self.hook_name) a = {'resources_available.ncpus': (EQ, 0), 'state': 'free'} no_cpu_vnodes = self.server.filter(VNODE, a, attrop=PTL_AND) if no_cpu_vnodes: # TestFunctional.setUp() would error out if leftover setup # has no cpus vnodes. Best to cleanup vnodes altogether. self.logger.info("Deleting the existing vnodes") self.mom.delete_vnode_defs() self.mom.restart() for mom in self.moms.values(): if mom.is_cpuset_mom(): mom.revert_to_default = False TestFunctional.setUp(self) # Some of the tests requires 2 or 3 nodes. 
# Setting the default values when no mom is specified self.vntypename = [] self.iscray = False self.noprefix = False self.tempfile = [] self.moms_list = [] self.hosts_list = [] self.nodes_list = [] self.paths = {} for cnt in range(0, len(self.moms)): mom = self.moms.values()[cnt] if mom.is_cray(): self.iscray = True host = mom.shortname # Check if mom has needed cgroup mounted, otherwise skip test self.paths[host] = self.get_paths(host) if not self.paths[host]['cpuset']: self.skipTest('cpuset subsystem not mounted') self.logger.info("%s: cgroup cpuset is mounted" % host) if self.iscray: node = self.get_hostname(host) else: node = host vntype = self.get_vntype(host) if vntype is None: vntype = "no_cgroups" self.logger.info("vntype value is %s" % vntype) self.logger.info("Deleting the existing vnodes on %s" % host) mom.delete_vnode_defs() # Restart MoM time.sleep(2) time_before_restart = int(time.time()) time.sleep(2) mom.restart() # Make sure that MoM has restarted far enough before reconfiguring # as that sends a HUP and may otherwise interfere with the restart # We send either a HELLO or a restart to server -- wait for that mom.log_match("sent to server", starttime=time_before_restart, n='ALL') self.logger.info("increase log level for mom and \ set polling intervals") c = {'$logevent': '0xffffffff', '$clienthost': self.server.name, '$min_check_poll': 8, '$max_check_poll': 12} mom.add_config(c) self.moms_list.append(mom) self.hosts_list.append(host) self.nodes_list.append(node) self.vntypename.append(vntype) # Setting self.mom defaults to primary mom as some of # library methods assume that self.mom = self.moms_list[0] host = self.moms_list[0].shortname # Delete ALL vnodes # Re-creation moved to the end *after* we correctly set up the hook self.server.manager(MGR_CMD_DELETE, NODE, None, "") self.serverA = self.servers.values()[0].name self.mem = 'true' if not self.paths[host]['memory']: self.mem = 'false' self.swapctl = self.is_memsw_enabled(host, 
self.paths[host]['memsw']) self.server.set_op_mode(PTL_CLI) self.server.cleanup_jobs() if not self.iscray: self.remove_vntype() self.eatmem_script = """ import sys import time MB = 2 ** 20 iterations = 1 chunkSizeMb = 1 sleeptime = 0 if (len(sys.argv) > 1): iterations = int(sys.argv[1]) if (len(sys.argv) > 2): chunkSizeMb = int(sys.argv[2]) if (len(sys.argv) > 3): sleeptime = int(sys.argv[3]) if (iterations < 1): print('Iteration count must be greater than zero.') exit(1) if (chunkSizeMb < 1): print('Chunk size must be greater than zero.') exit(1) totalSizeMb = chunkSizeMb * iterations print('Allocating %d chunk(s) of size %dMB. (%dMB total)' % (iterations, chunkSizeMb, totalSizeMb)) buf = '' for i in range(iterations): print('allocating %dMB' % ((i + 1) * chunkSizeMb)) buf += ('#' * MB * chunkSizeMb) if sleeptime > 0: time.sleep(sleeptime) """ self.eatmem_script2 = """ import sys import time MB = 2 ** 20 iterations1 = 1 chunkSizeMb1 = 1 sleeptime1 = 0 if (len(sys.argv) > 1): iterations1 = int(sys.argv[1]) if (len(sys.argv) > 2): chunkSizeMb1 = int(sys.argv[2]) if (len(sys.argv) > 3): sleeptime1 = int(sys.argv[3]) if (iterations1 < 1): print('Iteration count must be greater than zero.') exit(1) if (chunkSizeMb1 < 1): print('Chunk size must be greater than zero.') exit(1) totalSizeMb1 = chunkSizeMb1 * iterations1 print('Allocating %d chunk(s) of size %dMB. 
(%dMB total)' % (iterations1, chunkSizeMb1, totalSizeMb1)) start_time1 = time.time() buf = '' for i in range(iterations1): print('allocating %dMB' % ((i + 1) * chunkSizeMb1)) buf += ('#' * MB * chunkSizeMb1) end_time1 = time.time() if sleeptime1 > 0 and (end_time1 - start_time1) < sleeptime1 : time.sleep(sleeptime1 - end_time1 + start_time1) if len(sys.argv) <= 4: exit(0) iterations2 = 1 chunkSizeMb2 = 1 sleeptime2 = 0 if (len(sys.argv) > 4): iterations2 = int(sys.argv[4]) if (len(sys.argv) > 5): chunkSizeMb2 = int(sys.argv[5]) if (len(sys.argv) > 6): sleeptime2 = int(sys.argv[6]) if (iterations2 < 1): print('Iteration count must be greater than zero.') exit(1) if (chunkSizeMb2 < 1): print('Chunk size must be greater than zero.') exit(1) totalSizeMb2 = chunkSizeMb2 * iterations2 print('Allocating %d chunk(s) of size %dMB. (%dMB total)' % (iterations2, chunkSizeMb2, totalSizeMb2)) start_time2 = time.time() # Do not reinitialize buf!! for i in range(iterations2): print('allocating %dMB' % ((i + 1) * chunkSizeMb2)) buf += ('#' * MB * chunkSizeMb2) end_time2 = time.time() if sleeptime2 > 0 and (end_time2 - start_time2) < sleeptime2 : time.sleep(sleeptime2 - end_time2 + start_time2) """ self.eatmem_job1 = \ '#PBS -joe\n' \ '#PBS -S /bin/bash\n' \ 'sleep 10\n' \ 'python_path=`which python 2>/dev/null`\n' \ 'python3_path=`which python3 2>/dev/null`\n' \ 'python2_path=`which python2 2>/dev/null`\n' \ 'if [ -z "$python_path" ]; then\n' \ ' if [ -n "$python3_path" ]; then\n' \ ' python_path=$python3_path\n' \ ' else\n' \ ' python_path=$python2_path\n' \ ' fi\n' \ 'fi\n' \ 'if [ -z "$python_path" ]; then\n' \ ' echo Exiting -- no python found\n' \ ' exit 1\n' \ 'fi\n' \ '$python_path - 80 10 10 </dev/null`\n' \ 'python3_path=`which python3 2>/dev/null`\n' \ 'python2_path=`which python2 2>/dev/null`\n' \ 'if [ -z "$python_path" ]; then\n' \ ' if [ -n "$python3_path" ]; then\n' \ ' python_path=$python3_path\n' \ ' else\n' \ ' python_path=$python2_path\n' \ ' fi\n' \ 'fi\n' \ 
'if [ -z "$python_path" ]; then\n' \ ' echo Exiting -- no python found\n' \ ' exit 1\n' \ 'fi\n' \ 'let i=0; while [ $i -lt 400000 ]; do let i+=1 ; done\n' \ '$python_path - 200 2 10 </dev/null`\n' \ 'python3_path=`which python3 2>/dev/null`\n' \ 'python2_path=`which python2 2>/dev/null`\n' \ 'if [ -z "$python_path" ]; then\n' \ ' if [ -n "$python3_path" ]; then\n' \ ' python_path=$python3_path\n' \ ' else\n' \ ' python_path=$python2_path\n' \ ' fi\n' \ 'fi\n' \ 'if [ -z "$python_path" ]; then\n' \ ' echo Exiting -- no python found\n' \ ' exit 1\n' \ 'fi\n' \ 'timeout 8 md5sum .slice/-.slice # (and needs to be passed through systemd_escape) # 2) / # # Some older hooks used either depending on the OS platform # which was the reason to support a list in the first place # # If you need to add paths to make the tests support older hooks, # put the least likely paths at the end of the list, to avoid # changing test timings too much. # jobdirs = [os.path.join(basedir, 'pbs_jobs.service/jobid', jobid)] for jdir in jobdirs: if self.du.isdir(hostname=host, path=jdir, sudo=True): return jdir return None def find_main_cpath(self, cdir, host=None): if host is None: host = self.hosts_list[0] rc = self.du.isdir(host, path=cdir) if rc: paths = ['pbs_jobs.service/jobid', 'pbs.service/jobid', 'pbs.slice', 'pbs'] for p in paths: cpath = os.path.join(cdir, p) rc = self.du.isdir(host, path=cpath) if rc: return cpath return None def load_hook(self, filename, mom_checks=True): """ Import and enable a hook pointed to by the URL specified. 
""" try: with open(filename, 'r') as fd: script = fd.read() except IOError: self.assertTrue(False, 'Failed to open hook file %s' % filename) events = ['execjob_begin', 'execjob_launch', 'execjob_attach', 'execjob_epilogue', 'execjob_end', 'exechost_startup', 'exechost_periodic', 'execjob_resize', 'execjob_abort'] # Alarm timeout should be set really large because some tests will # create a lot of simultaneous jobs on a single (slow) MoM # Shipped default is 90 seconds, which is reasonable for real hosts, # but not for containers or VMs sharing a host a = {'enabled': 'True', 'freq': '10', 'alarm': 120, 'event': events} # Sometimes the deletion of the old hook is still pending failed = True for _ in range(5): try: self.server.create_import_hook(self.hook_name, a, script, overwrite=True, level=logging.DEBUG) except Exception: time.sleep(2) else: failed = False break if failed: self.skipTest('pbs_cgroups_hook: failed to load hook') # Add the configuration self.load_default_config(mom_checks=mom_checks) def load_config(self, cfg, mom_checks=True): """ Create a hook configuration file with the provided contents. """ fn = self.du.create_temp_file(hostname=self.serverA, body=cfg) self.tempfile.append(fn) self.logger.info('Current config: %s' % cfg) a = {'content-type': 'application/x-config', 'content-encoding': 'default', 'input-file': fn} # In tests that use this, make sure that other hook CF # copies from setup, node creations, MoM restarts etc. # are all finished, so that we don't match a CF copy # message in the logs from someone else! 
time.sleep(5) just_before_import = int(time.time()) time.sleep(2) self.server.manager(MGR_CMD_IMPORT, HOOK, a, self.hook_name) if mom_checks: self.moms_list[0].log_match('pbs_cgroups.CF;' 'copy hook-related ' 'file request received', starttime=just_before_import, n='ALL') pbs_home = self.server.pbs_conf['PBS_HOME'] svr_conf = os.path.join( os.sep, pbs_home, 'server_priv', 'hooks', 'pbs_cgroups.CF') pbs_home = self.mom.pbs_conf['PBS_HOME'] mom_conf = os.path.join( os.sep, pbs_home, 'mom_priv', 'hooks', 'pbs_cgroups.CF') if mom_checks: # reload config if server and mom cfg differ up to count times count = 5 while (count > 0): r1 = self.du.run_cmd(cmd=['cat', svr_conf], sudo=True, hosts=self.serverA) r2 = self.du.run_cmd(cmd=['cat', mom_conf], sudo=True, hosts=self.mom.shortname) if r1['out'] != r2['out']: self.logger.info('server & mom pbs_cgroups.CF differ') time.sleep(2) just_before_import = int(time.time()) time.sleep(2) self.server.manager(MGR_CMD_IMPORT, HOOK, a, self.hook_name) self.moms_list[0].log_match('pbs_cgroups.CF;' 'copy hook-related ' 'file request received', starttime=just_before_import, n='ALL') else: self.logger.info('server & mom pbs_cgroups.CF match') break time.sleep(1) count -= 1 self.assertGreater(count, 0, "pbs_cgroups.CF failed to load") # A HUP of each mom ensures update to hook config file is # seen by the exechost_startup hook. 
        # Tail of the config-reload helper: HUP every MoM so the
        # exechost_startup hook re-reads the just-imported config file.
        # sleep/timestamp/sleep pattern guards against log-timestamp
        # granularity and small clock differences between hosts.
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        for mom in self.moms_list:
            mom.signal('-HUP')
            mom.log_match('hook_perf_stat;label=hook_exechost_startup_'
                          'pbs_cgroups_.* profile_stop',
                          regexp=True, starttime=stime, existence=True,
                          interval=1, n='ALL')

    def load_default_config(self, mom_checks=True):
        """
        Load the default pbs_cgroups hook config file shipped under
        PBS_EXEC and import it into the server.

        :param mom_checks: when True, also verify via the first MoM's
                           log that the config file was propagated
        """
        self.config_file = os.path.join(self.server.pbs_conf['PBS_EXEC'],
                                        'lib', 'python', 'altair',
                                        'pbs_hooks', 'pbs_cgroups.CF')
        # bracket the import with sleeps so the log_match start time is
        # safely between old and new log entries
        time.sleep(2)
        now = int(time.time())
        time.sleep(2)
        a = {'content-type': 'application/x-config',
             'content-encoding': 'default',
             'input-file': self.config_file}
        self.server.manager(MGR_CMD_IMPORT, HOOK, a, self.hook_name)
        if not mom_checks:
            return
        self.moms_list[0].log_match('pbs_cgroups.CF;copy hook-related '
                                    'file request received',
                                    starttime=now, n='ALL')

    def set_vntype(self, host, typestring='myvntype'):
        """
        Set the vnode type for the local mom by writing the string into
        mom_priv/vntype on the given host.

        :param host: host on which to install the vntype file
        :param typestring: vntype value to write
        """
        # NOTE(review): uses the server's PBS_HOME to build a mom-side
        # path; assumes server and mom share the same PBS_HOME layout
        # (remove_vntype uses mom.pbs_conf instead) -- confirm
        pbs_home = self.server.pbs_conf['PBS_HOME']
        vntype_file = os.path.join(pbs_home, 'mom_priv', 'vntype')
        self.logger.info('Setting vntype to %s in %s on mom %s' %
                         (typestring, vntype_file, host))
        localhost = socket.gethostname()
        fn = self.du.create_temp_file(hostname=localhost, body=typestring)
        self.tempfile.append(fn)
        ret = self.du.run_copy(hosts=host, src=fn, dest=vntype_file,
                               sudo=True, uid='root', gid='root',
                               mode=0o644)
        if ret['rc'] != 0:
            self.skipTest('pbs_cgroups_hook: failed to set vntype')

    def remove_vntype(self):
        """
        Unset the vnode type on the moms.
        """
        cmd1 = 'hostname -s'
        rv1 = self.du.run_cmd(hosts=host, cmd=cmd1)
        host2 = self.get_hostname(host)
        # double quotes: form used inside the cgroup hook config file;
        # single quotes (mlog): form echoed by the hook in its log lines
        hostlist = '"' + host2 + '"'
        moms = [hostlist]
        mlog = ["'" + host2 + "'"]
        # if shortname and hostname is not same then construct a
        # list including both to be passed to cgroups hook
        if (str(rv1['out'][0]) != host2):
            moms.append('"' + str(rv1['out'][0]) + '"')
            mlog.append("'" + str(rv1['out'][0]) + "'")
        if len(moms) > 1:
            mom1 = ','.join(moms)
            log1 = ', '.join(mlog)
        else:
            # single-entry case: same value the list already holds
            mom1 = '"' + host2 + '"'
            log1 = "'" + host2 + "'"
        return mom1, log1

    @requirements(num_moms=2)
    def test_cgroup_vntype_excluded(self):
        """
        Test to verify that cgroups are not enforced on nodes
        that have an exclude vntype file set, while a second mom
        with a different vntype still gets a cgroup.
        """
        name = 'CGROUP8'
        if self.vntypename[0] == 'no_cgroups':
            self.logger.info('Adding vntype %s to mom %s ' %
                             (self.vntypename[0], self.moms_list[0]))
            self.set_vntype(typestring=self.vntypename[0],
                            host=self.hosts_list[0])
        # put vntype[0] in the hook's exclude_vntypes list
        a = self.cfg1 % ('', '"' + self.vntypename[0] + '"', '', '',
                         self.mem, self.swapctl)
        self.load_config(a)
        for m in self.moms.values():
            m.restart()
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # sleep/timestamp/sleep: guard against log-timestamp granularity
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        self.logger.info('memory subsystem is at location %s' %
                         self.paths[self.hosts_list[0]]['memory'])
        # excluded vnode type => no per-job memory cgroup directory
        cpath = self.get_cgroup_job_dir('memory', jid, self.hosts_list[0])
        self.assertFalse(self.is_dir(cpath, self.hosts_list[0]))
        self.moms_list[0].log_match(
            "%s is in the excluded vnode type list: ['%s']" %
            (self.vntypename[0], self.vntypename[0]),
            starttime=stime, n='ALL')
        self.logger.info('vntypes on both hosts are: %s and %s' %
                         (self.vntypename[0], self.vntypename[1]))
        if self.vntypename[1] == self.vntypename[0]:
            self.logger.info('Skipping the second part of this test '
                             'since hostB also has same vntype value')
            return
        # second mom has a different vntype: cgroup must be created
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[1], ATTR_N: name}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.sleep600_job)
        jid2 = self.server.submit(j1)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid2)
        self.server.status(JOB, ATTR_o, jid2)
        o = j1.attributes[ATTR_o]
        self.tempfile.append(o)
        cpath = self.get_cgroup_job_dir('memory', jid2, self.hosts_list[1])
        self.assertTrue(self.is_dir(cpath, self.hosts_list[1]))

    @requirements(num_moms=2)
    def test_cgroup_host_excluded(self):
        """
        Test to verify that cgroups are not enforced on nodes
        that have the exclude_hosts set, while a non-excluded
        second host still gets a cgroup.
        """
        name = 'CGROUP9'
        mom, log = self.get_host_names(self.hosts_list[0])
        # exclude host[0] in the hook config (first %s slot)
        self.load_config(self.cfg1 % ('%s' % mom, '', '', '',
                                      self.mem, self.swapctl))
        for m in self.moms.values():
            m.restart()
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # sleep/timestamp/sleep: guard against log-timestamp granularity
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # excluded host => no per-job memory cgroup directory
        cpath = self.get_cgroup_job_dir('memory', jid, self.hosts_list[0])
        self.assertFalse(self.is_dir(cpath, self.hosts_list[0]))
        host = self.get_hostname(self.hosts_list[0])
        self.moms_list[0].log_match('%s is in the excluded host list: [%s]' %
                                    (host, log),
                                    starttime=stime, n='ALL')
        self.server.delete(jid, wait=True)
        # non-excluded host must still create the cgroup
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[1], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid2 = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid2)
        self.server.status(JOB, ATTR_o, jid2)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        cpath = self.get_cgroup_job_dir('memory', jid2, self.hosts_list[1])
        self.assertTrue(self.is_dir(cpath, self.hosts_list[1]))

    @requirements(num_moms=2)
    def test_cgroup_exclude_vntype_mem(self):
        """
        Test to verify that the memory subsystem is not enforced on
        nodes whose vntype is in the hook's per-subsystem exclude
        list, while a mom with a different vntype still gets one.
        """
        name = 'CGROUP12'
        if self.vntypename[0] == 'no_cgroups':
            self.logger.info('Adding vntype %s to mom %s' %
                             (self.vntypename[0], self.moms_list[0]))
            # NOTE(review): literal 'no_cgroups' here matches the
            # surrounding condition, but vntypename[0] is used elsewhere
            self.set_vntype(typestring='no_cgroups',
                            host=self.hosts_list[0])
        # exclude the vntype for the memory subsystem specifically
        self.load_config(self.cfg3 % ('', 'false', '', self.mem,
                                      '"' + self.vntypename[0] + '"',
                                      self.swapctl,
                                      '"' + self.vntypename[0] + '"'))
        for m in self.moms.values():
            m.restart()
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # sleep/timestamp/sleep: guard against log-timestamp granularity
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        self.moms_list[0].log_match('cgroup excluded for subsystem memory '
                                    'on vnode type %s' % self.vntypename[0],
                                    starttime=stime, n='ALL')
        self.logger.info('vntype values for each hosts are: %s and %s' %
                         (self.vntypename[0], self.vntypename[1]))
        if self.vntypename[0] == self.vntypename[1]:
            self.logger.info('Skipping the second part of this test '
                             'since hostB also has same vntype value')
            return
        # second mom's vntype is not excluded: memory cgroup expected
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[1], ATTR_N: name}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.sleep600_job)
        jid2 = self.server.submit(j1)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid2)
        self.server.status(JOB, ATTR_o, jid2)
        o = j1.attributes[ATTR_o]
        self.tempfile.append(o)
        cpath = self.get_cgroup_job_dir('memory', jid2, self.hosts_list[1])
        self.assertTrue(self.is_dir(cpath, self.hosts_list[1]))

    def test_cgroup_periodic_update_check_values(self):
        """
        Test to verify that cgroups are reporting usage for cput and
        mem (and vmem when swap control is enabled) via the
        exechost_periodic event.
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        name = 'CGROUP13'
        # run the periodic hook every 2 seconds
        conf = {'freq': 2}
        self.server.manager(MGR_CMD_SET, HOOK, conf, self.hook_name)
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        a = {'Resource_List.select': '1:ncpus=1:mem=500mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.eatmem_job3)
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # Scouring the logs for initial values takes too long
        resc_list = ['resources_used.mem']
        if self.swapctl == 'true':
            resc_list.append('resources_used.vmem')
        # early usage should still be small (< 300000kb)
        qstat = self.server.status(JOB, resc_list, id=jid)
        mem = convert_size(qstat[0]['resources_used.mem'], 'kb')
        match = re.match(r'(\d+)kb', mem)
        self.assertFalse(match is None)
        usage = int(match.groups()[0])
        self.assertGreater(300000, usage)
        if self.swapctl == 'true':
            vmem = convert_size(qstat[0]['resources_used.vmem'], 'kb')
            match = re.match(r'(\d+)kb', vmem)
            self.assertFalse(match is None)
            usage = int(match.groups()[0])
            self.assertGreater(300000, usage)
        # the periodic event must not have raised a TypeError
        err_msg = "Unexpected error in pbs_cgroups " + \
                  "handling exechost_periodic event: TypeError"
        self.moms_list[0].log_match(err_msg, max_attempts=3, interval=1,
                                    n='ALL', starttime=stime,
                                    existence=False)
        # Allow some time to pass for values to be updated
        # sleep 2s: make sure no old log lines will match 'begin' time
        time.sleep(2)
        begin = int(time.time())
        # sleep 2s to allow for small time differences and rounding errors
        time.sleep(2)
        self.logger.info('Waiting for periodic hook to update usage data.')
        # loop to check if cput, mem, vmem are expected values
        cput_usage = 0.0
        mem_usage = 0
        vmem_usage = 0
        # Faster systems might expect to see the usage you finally expect
        # recorder after 8-10 seconds; on TH it can take up to a minute
        time.sleep(8)
        for count in range(30):
            time.sleep(2)
            if self.paths[self.hosts_list[0]]['cpuacct'] \
                    and cput_usage <= 1.0:
                # Match last line from the bottom
                line = self.moms_list[0].log_match(
                    '%s;update_job_usage: CPU usage:' % jid,
                    starttime=begin, n='ALL')
                match = re.search(r'CPU usage: ([0-9.]+) secs', line[1])
                cput_usage = float(match.groups()[0])
                self.logger.info("Found cput_usage: %ss" % str(cput_usage))
            if (self.paths[self.hosts_list[0]]['memory']
                    and mem_usage <= 400000):
                # Match last line from the bottom
                line = self.moms_list[0].log_match(
                    '%s;update_job_usage: Memory usage: mem=' % jid,
                    starttime=begin, n='ALL')
                match = re.search(r'mem=(\d+)kb', line[1])
                mem_usage = int(match.groups()[0])
                self.logger.info("Found mem_usage: %skb" % str(mem_usage))
            if self.swapctl == 'true' and vmem_usage <= 400000:
                # Match last line from the bottom
                line = self.moms_list[0].log_match(
                    '%s;update_job_usage: Memory usage: vmem=' % jid,
                    starttime=begin, n='ALL')
                match = re.search(r'vmem=(\d+)kb', line[1])
                vmem_usage = int(match.groups()[0])
                self.logger.info("Found vmem_usage: %skb" % str(vmem_usage))
            if cput_usage > 1.0 and mem_usage > 400000:
                if self.swapctl == 'true':
                    if vmem_usage > 400000:
                        break
                else:
                    break
            # try to make next loop match the _next_ updates
            # note: we might still be unlucky and just match an old update,
            # but not next time: the loop's sleep will make 'begin' advance
            begin = int(time.time())
        self.assertGreater(cput_usage, 1.0)
        self.assertGreater(mem_usage, 400000)
        if self.swapctl == 'true':
            self.assertGreater(vmem_usage, 400000)

    def test_cgroup_cpuset_and_memory(self):
        """
        Test to verify that the job cgroup is created correctly
        Check to see that cpuset.cpus=0, cpuset.mems=0 and that
        memory.limit_in_bytes = 314572800
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        name = 'CGROUP1'
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        # This test expects the job to land
        # on CPU 0.
        # The previous test may have qdel -Wforce its jobs, and then it takes
        # some time for MoM to run the execjob_epilogue and execjob_end
        # *after* the job has disappeared on the server.
        # So wait a while before restarting MoM
        time.sleep(10)
        # Restart mom for changes made by cgroups hook to take effect
        self.mom.restart()
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name, ATTR_k: 'oe'}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        fna = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        self.assertFalse(fna is None, 'No job directory for cpuset subsystem')
        fnma = self.get_cgroup_job_dir('memory', jid, self.hosts_list[0])
        self.assertFalse(fnma is None, 'No job directory for memory subsystem')
        # cpuset_mem_script dumps CpuIDs/MemorySocket/MemoryLimit for
        # the given cpuset and memory cgroup directories
        memscr = self.du.run_cmd(cmd=[self.cpuset_mem_script % (fna, fnma)],
                                 as_script=True, hosts=self.mom.shortname)
        memscr_out = memscr['out']
        self.logger.info('memscr_out:\n%s' % memscr_out)
        self.assertTrue('CpuIDs=0' in memscr_out)
        self.logger.info('CpuIDs check passed')
        self.assertTrue('MemorySocket=0' in memscr_out)
        self.logger.info('MemorySocket check passed')
        if self.mem == 'true':
            # 314572800 bytes == the requested 300mb
            self.assertTrue('MemoryLimit=314572800' in memscr_out)
            self.logger.info('MemoryLimit check passed')

    def test_cgroup_cpuset_and_memsw(self):
        """
        Test to verify that the job cgroup is created correctly
        using the default memory and vmem
        Check to see that cpuset.cpus=0, cpuset.mems=0 and that
        memory.limit_in_bytes = 100663296
        memory.memsw.limit_in_bytes = 201326592
        If there is too little swap, the latter could be smaller
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        name = 'CGROUP2'
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        # no mem/vmem request: hook defaults apply
        a = {'Resource_List.select': '1:ncpus=1:host=%s' %
             self.hosts_list[0],
             ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        fn = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        fnm = self.get_cgroup_job_dir('memory', jid, self.hosts_list[0])
        scr = self.du.run_cmd(cmd=[self.cpuset_mem_script % (fn, fnm)],
                              as_script=True, hosts=self.mom.shortname)
        scr_out = scr['out']
        self.logger.info('scr_out:\n%s' % scr_out)
        self.assertTrue('CpuIDs=0' in scr_out)
        self.logger.info('CpuIDs check passed')
        self.assertTrue('MemorySocket=0' in scr_out)
        self.logger.info('MemorySocket check passed')
        if self.mem == 'true':
            self.assertTrue('MemoryLimit=100663296' in scr_out)
            self.logger.info('MemoryLimit check passed')
        if self.swapctl == 'true':
            # Get total phys+swap memory available
            # NOTE(review): reads limits from the 'jobid' directory under
            # pbs_jobs.service -- presumably the hook's parent cgroup for
            # jobs; confirm against the hook's layout
            mem_base = os.path.join(self.paths[self.hosts_list[0]]
                                    ['memory'], 'pbs_jobs.service', 'jobid')
            vmem_avail = os.path.join(mem_base,
                                      'memory.memsw.limit_in_bytes')
            result = self.du.cat(hostname=self.mom.hostname,
                                 filename=vmem_avail, sudo=True)
            vmem_avail_in_bytes = None
            try:
                vmem_avail_in_bytes = int(result['out'][0])
            except Exception:
                # None will be seen as a failure, nothing to do
                pass
            self.logger.info("total available memsw: %d"
                             % vmem_avail_in_bytes)
            self.assertTrue(vmem_avail_in_bytes is not None,
                            "Unable to read total memsw available")
            mem_avail = os.path.join(mem_base, 'memory.limit_in_bytes')
            result = self.du.cat(hostname=self.mom.hostname,
                                 filename=mem_avail, sudo=True)
            mem_avail_in_bytes = None
            try:
                mem_avail_in_bytes = int(result['out'][0])
            except Exception:
                # None will be seen as a failure, nothing to do
                pass
            self.logger.info("total available mem: %d" % mem_avail_in_bytes)
            self.assertTrue(mem_avail_in_bytes is not None,
                            "Unable to read total mem available")
            # expected memsw limit is mem default plus available swap,
            # capped at the vmem default
            swap_avail_in_bytes = vmem_avail_in_bytes - mem_avail_in_bytes
            MemswLimitExpected = (100663296
                                  + min(100663296, swap_avail_in_bytes))
            self.assertTrue(('MemswLimit=%d' % MemswLimitExpected)
                            in scr_out)
            self.logger.info('MemswLimit check passed')

    def test_cgroup_prefix_and_devices(self):
        """
        Test to verify that the cgroup prefix is set to "sbp" and
        that the devices subsystem exists with the correct devices
        allowed
        """
        if not self.paths[self.hosts_list[0]]['devices']:
            self.skipTest('Skipping test since no devices subsystem defined')
        name = 'CGROUP3'
        self.load_config(self.cfg2)
        # Restart mom for changes made by cgroups hook to take effect
        self.mom.restart()
        # Make sure to run on the MoM just restarted
        a = {ATTR_N: name}
        a['Resource_List.select'] = \
            '1:ncpus=1:mem=300mb:host=%s' % self.hosts_list[0]
        j = Job(TEST_USER, attrs=a)
        j.set_sleep_time(600)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        devd = self.paths[self.hosts_list[0]]['devices']
        scr = self.du.run_cmd(
            cmd=[self.check_dirs_script % (jid, devd)],
            as_script=True, hosts=self.mom.shortname)
        scr_out = scr['out']
        self.logger.info('scr_out:\n%s' % scr_out)
        # the config file named entries must be translated to major/minor
        # containers will make them different!!
# self.du.run_cmd returns a list of one-line strings # the console awk command produces major and minor on separate lines console_results = \ self.du.run_cmd(cmd=['ls -al /dev/console' '| awk \'BEGIN {FS=" |,"} ' '{print $5} {print $7}\''], as_script=True, hosts=self.hosts_list[0]) (console_major, console_minor) = console_results['out'] # only one line here tty0_major_results = \ self.du.run_cmd(cmd=['ls -al /dev/tty0' '| awk \'BEGIN {FS=" |,"} ' '{print $5}\''], as_script=True, hosts=self.hosts_list[0]) tty0_major = tty0_major_results['out'][0] check_devices = ['b *:* rwm', 'c %s:%s rwm' % (console_major, console_minor), 'c %s:* rwm' % (tty0_major), 'c 1:* rwm', 'c 10:* rwm'] for device in check_devices: self.assertTrue(device in scr_out, '"%s" not found in: %s' % (device, scr_out)) self.logger.info('device_list check passed') def test_devices_and_gpu_discovery(self): """ Test to verify that if the device subsystem is enabled and discover_gpus is true, _discover_gpus is called The GPU tests should in theory make this redundant, but they require a test harness that has GPUs. This test will allow to see if the GPU discovery is at least called even when the test harness has no GPUs. """ if not self.paths[self.hosts_list[0]]['devices']: self.skipTest('Skipping test since no devices subsystem defined') name = 'CGROUP3' time.sleep(2) begin = int(time.time()) time.sleep(2) self.load_config(self.cfg14 % ('true', 'true')) # These will throw an exception if the routines that should not # have been called were called. 
# n='ALL' is needed because the cgroup hook is so verbose # that 50 lines will not suffice self.moms_list[0].log_match('_discover_devices', starttime=begin, existence=True, max_attempts=2, interval=1, n='ALL') self.moms_list[0].log_match('NVIDIA SMI', starttime=begin, existence=True, max_attempts=2, interval=1, n='ALL') self.logger.info('devices_and_gpu_discovery check passed') def test_suppress_devices_discovery(self): """ Test to verify that if the device subsystem is turned off, neither _discover_devices nor _discover_gpus is called """ if not self.paths[self.hosts_list[0]]['devices']: self.skipTest('Skipping test since no devices subsystem defined') name = 'CGROUP3' time.sleep(2) begin = int(time.time()) time.sleep(2) self.load_config(self.cfg14 % ('true', 'false')) # These will throw an exception if the routines that should not # have been called were called. # n='ALL' is needed because the cgroup hook is so verbose # that 50 lines will not suffice self.moms_list[0].log_match('_discover_devices', starttime=begin, existence=False, max_attempts=2, interval=1, n='ALL') self.moms_list[0].log_match('_discover_gpus', starttime=begin, existence=False, max_attempts=2, interval=1, n='ALL') self.logger.info('suppress_devices_discovery check passed') def test_suppress_gpu_discovery(self): """ Test to verify that if the device subsystem is enabled and discover_gpus is false, nvidia-smi is not called discover_gpus is called but just returns {} """ if not self.paths[self.hosts_list[0]]['devices']: self.skipTest('Skipping test since no devices subsystem defined') name = 'CGROUP3' time.sleep(2) begin = int(time.time()) time.sleep(2) self.load_config(self.cfg14 % ('false', 'true')) # These will throw an exception if the routines that should not # have been called were called. 
# n='ALL' is needed because the cgroup hook is so verbose # that 50 lines will not suffice self.moms_list[0].log_match('_discover_devices', starttime=begin, existence=True, max_attempts=2, interval=1, n='ALL') self.moms_list[0].log_match('NVIDIA SMI', starttime=begin, existence=False, max_attempts=2, interval=1, n='ALL') self.logger.info('suppress_gpu_discovery check passed') def test_cgroup_cpuset(self): """ Test to verify that 2 jobs are not assigned the same cpus """ pcpus = 0 with open('/proc/cpuinfo', 'r') as desc: for line in desc: if re.match('^processor', line): pcpus += 1 if pcpus < 2: self.skipTest('Test requires at least two physical CPUs') name = 'CGROUP4' # since we do not configure vnodes ourselves wait for the setup # of this test to propagate all hooks etc. # otherwise the load_config tests to see if it's all done # might get confused # occasional trouble seen on TH2 self.load_config(self.cfg3 % ('', 'false', '', self.mem, '', self.swapctl, '')) # Submit two jobs a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' % self.hosts_list[0], ATTR_N: name + 'a'} j1 = Job(TEST_USER, attrs=a) j1.create_script(self.sleep600_job) jid1 = self.server.submit(j1) b = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' % self.hosts_list[0], ATTR_N: name + 'b'} j2 = Job(TEST_USER, attrs=b) j2.create_script(self.sleep600_job) jid2 = self.server.submit(j2) a = {'job_state': 'R'} # Make sure they are both running self.server.expect(JOB, a, jid1) self.server.expect(JOB, a, jid2) # cpuset paths for both jobs fn1 = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[0]) fn2 = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[0]) # Capture the output of cpuset_mem_script for both jobs scr1 = self.du.run_cmd(cmd=[self.cpuset_mem_script % (fn1, None)], as_script=True, hosts=self.hosts_list[0]) scr1_out = scr1['out'] self.logger.info('scr1_out:\n%s' % scr1_out) scr2 = self.du.run_cmd(cmd=[self.cpuset_mem_script % (fn2, None)], as_script=True, 
                               hosts=self.hosts_list[0])
        scr2_out = scr2['out']
        self.logger.info('scr2_out:\n%s' % scr2_out)
        # Ensure the CPU ID for each job differs
        cpuid1 = None
        for kv in scr1_out:
            if 'CpuIDs=' in kv:
                cpuid1 = kv
                break
        self.assertNotEqual(cpuid1, None, 'Could not read first CPU ID.')
        cpuid2 = None
        for kv in scr2_out:
            if 'CpuIDs=' in kv:
                cpuid2 = kv
                break
        self.assertNotEqual(cpuid2, None, 'Could not read second CPU ID.')
        self.logger.info("cpuid1 = %s and cpuid2 = %s" % (cpuid1, cpuid2))
        self.assertNotEqual(cpuid1, cpuid2,
                            'Processes should be assigned to different CPUs')
        self.logger.info('CpuIDs check passed')

    @timeout(1800)
    def test_cgroup_cpuset_ncpus_are_cores(self):
        """
        Test to verify that correct number of jobs run on a
        hyperthread enabled system when ncpus_are_cores is set
        to true.
        """
        # Check that system has hyperthreading enabled and has
        # at least two threads ("pcpus")
        # WARNING: do not assume that physical CPUs are numbered from 0
        # and that all processors from a physical ID are contiguous
        # count the number of different physical IDs with a set!
        pcpus = 0
        sibs = 0
        cores = 0
        pval = 0
        phys_set = set()
        with open('/proc/cpuinfo', 'r') as desc:
            for line in desc:
                if re.match('^processor', line):
                    pcpus += 1
                sibs_match = re.search(r'siblings : ([0-9]+)', line)
                cores_match = re.search(r'cpu cores : ([0-9]+)', line)
                phys_match = re.search(r'physical id : ([0-9]+)', line)
                if sibs_match:
                    sibs = int(sibs_match.groups()[0])
                if cores_match:
                    cores = int(cores_match.groups()[0])
                if phys_match:
                    pval = int(phys_match.groups()[0])
                    phys_set.add(pval)
        phys = len(phys_set)
        if (sibs == 0 or cores == 0):
            self.skipTest('Insufficient information about the processors.')
        if pcpus < 2:
            self.skipTest('This test requires at least two processors.')
        # siblings == cores means no hyperthreading
        if sibs / cores == 1:
            self.skipTest('This test requires hyperthreading to be enabled.')
        name = 'CGROUP18'
        self.load_config(self.cfg8 % ('', '', self.mem, '',
                                      self.swapctl, ''))
        # Make sure to restart MOM
        # HUP is not enough to get rid of earlier
        # per socket vnodes created when vnode_per_numa_node=True
        self.mom.restart()
        # Submit M jobs N cpus wide, where M is the amount of physical
        # processors and N is number of 'cpu cores' per M. Expect them to run.
        njobs = phys
        if njobs > 100:
            self.skipTest("too many jobs (%d) to submit" % njobs)
        a = {'Resource_List.select': '1:ncpus=%s:mem=300mb:host=%s' %
             (cores, self.hosts_list[0]), ATTR_N: name + 'a'}
        for _ in range(njobs):
            j = Job(TEST_USER, attrs=a)
            # make sure this stays around for an hour
            # (or until deleted in teardown)
            j.set_sleep_time(3600)
            jid = self.server.submit(j)
            a1 = {'job_state': 'R'}
            # give the scheduler, server and MoM some time
            # it's not a luxury on containers with few CPU resources
            time.sleep(2)
            self.server.expect(JOB, a1, jid)
        # Submit another job, expect in Q state -- this one with only 1 CPU
        b = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name + 'b'}
        j2 = Job(TEST_USER, attrs=b)
        jid2 = self.server.submit(j2)
        b1 = {'job_state': 'Q'}
        # Make sure to give the scheduler ample time here:
        # we want to make sure jid2 doesn't run because it can't,
        # not because the scheduler has not yet gotten to it
        time.sleep(30)
        self.server.expect(JOB, b1, jid2)

    def test_cgroup_enforce_memory(self):
        """
        Test to verify that the job is killed when it tries to use
        more memory than it requested
        """
        if not self.paths[self.hosts_list[0]]['memory'] or not self.mem:
            self.skipTest('Test requires memory subystem mounted')
        name = 'CGROUP5'
        self.load_config(self.cfg3b % ('false'))
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.eatmem_job1)
        # sleep/timestamp/sleep: guard against log-timestamp granularity
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # mem and vmem limit will both be set, and either could be detected
        self.mom.log_match('%s;Cgroup mem(ory|sw) limit exceeded' % jid,
                           regexp=True, n='ALL', starttime=stime)

    def test_cgroup_enforce_memsw(self):
        """
        Test to verify that the job is killed when it tries to use
        more vmem than it
        requested
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        # run the test if swap space is available
        if not self.mem or not self.swapctl:
            # NOTE(review): adjacent literals concatenate to
            # 'memswswap' with no separating space -- cosmetic only,
            # left unchanged here since it is a runtime string
            self.skipTest('Test requires memory controller with memsw'
                          'swap accounting enabled')
        if have_swap() == 0:
            self.skipTest('no swap space available on the local host')
        # Get the grandparent directory
        fn = self.paths[self.hosts_list[0]]['memory']
        fn = os.path.join(fn, 'memory.memsw.limit_in_bytes')
        if not self.is_file(fn, self.hosts_list[0]):
            self.skipTest('vmem resource not present on node')
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        name = 'CGROUP6'
        # Make sure output file is gone, otherwise wait and read
        # may pick up stale copy of earlier test
        self.du.rm(runas=TEST_USER, path='~/' + name + '.*',
                   as_script=True)
        a = {
            'Resource_List.select':
            '1:ncpus=1:mem=400mb:vmem=420mb:host=%s' % self.hosts_list[0],
            ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.eatmem_job1)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        # stdout path is '<host>:<path>'; exec_host is '<host>/<idx>...'
        filename = j.attributes[ATTR_o]
        ehost = j.attributes['exec_host']
        tmp_file = filename.split(':')[1]
        tmp_host = ehost.split('/')[0]
        tmp_out = self.wait_and_read_file(filename=tmp_file, host=tmp_host)
        self.tempfile.append(tmp_file)
        # accept any of the three possible kill indications in the
        # job's joined stdout/stderr
        success = False
        foundstr = ''
        if tmp_out == []:
            success = False
        else:
            joined_out = '\n'.join(tmp_out)
            if 'Cgroup memsw limit exceeded' in joined_out:
                success = True
                foundstr = 'Cgroup memsw limit exceeded'
            elif 'Cgroup mem limit exceeded' in joined_out:
                success = True
                foundstr = 'Cgroup mem limit exceeded'
            elif 'MemoryError' in joined_out:
                success = True
                foundstr = 'MemoryError'
        self.assertTrue(success, 'No Cgroup memory/memsw limit exceeded '
                        'or MemoryError found in joined stdout/stderr')
        self.logger.info('Joined stdout/stderr contained expected string: '
                         + foundstr)

    def test_cgroup_diag_messages(self):
        """
        Test to verify that job that exceeded resources has the
        diag_message set correctly.
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        # run the test if swap space is available
        if not self.mem or not self.swapctl:
            self.skipTest('Test requires memory controller with memsw'
                          'swap accounting enabled')
        if have_swap() == 0:
            self.skipTest('no swap space available on the local host')
        # Get the grandparent directory
        fn = self.paths[self.hosts_list[0]]['memory']
        fn = os.path.join(fn, 'memory.memsw.limit_in_bytes')
        if not self.is_file(fn, self.hosts_list[0]):
            self.skipTest('vmem resource not present on node')
        # Make sure job history is enabled to see when job is gone
        a = {'job_history_enable': 'True'}
        rc = self.server.manager(MGR_CMD_SET, SERVER, a)
        self.assertEqual(rc, 0)
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        a = {
            'Resource_List.select':
            '1:ncpus=1:mem=400mb:vmem=420mb:host=%s' % self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.eatmem_job1)
        jid = self.server.submit(j)
        # wait for the job to finish (history state 'F')
        a = {'job_state': 'F'}
        self.server.expect(JOB, a, jid, extend='x', offset=10)
        resc = ['resources_used.diag_messages']
        s = self.server.status(JOB, resc, id=jid, extend='x')
        # diag_messages is JSON keyed by mom shortname; strip the
        # quoting added around the attribute value
        dmsg = s[0]['resources_used.diag_messages'].replace("'", "")
        json_exceeded = json.loads(dmsg)
        msg = json_exceeded[self.mom.shortname]
        self.assertEqual(msg, 'Cgroup mem limit exceeded, '
                         'Cgroup memsw limit exceeded')

    def cgroup_offline_node(self, name, vnpernuma=False):
        """
        Per vnode_per_numa_node config setting, return True if able
        to verify that the node is offlined when it can't clean up
        the cgroup and brought back online once the cgroup is
        cleaned up.
""" # Make sure job history is enabled to see when job is gone a = {'job_history_enable': 'True'} rc = self.server.manager(MGR_CMD_SET, SERVER, a) self.assertEqual(rc, 0) self.server.expect(SERVER, {'job_history_enable': 'True'}) if 'freezer' not in self.paths[self.hosts_list[0]]: self.skipTest('Freezer cgroup is not mounted') # Get the grandparent directory fdir = self.paths[self.hosts_list[0]]['freezer'] if not self.is_dir(fdir, self.hosts_list[0]): self.skipTest('Freezer cgroup is not found') # Configure the hook self.load_config(self.cfg3 % ('', vnpernuma, '', self.mem, '', self.swapctl, '')) a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' % self.hosts_list[0], 'Resource_List.walltime': 600, ATTR_N: name} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) job_status = self.server.status(JOB, id=jid) filename = j.attributes[ATTR_o] tmp_file = filename.split(':')[1] self.tempfile.append(tmp_file) self.logger.info("Added %s to temp files to clean up" % tmp_file) self.logger.info("Job session ID is apparently %s" % str(j.attributes['session_id'])) # Query the pids in the cgroup jdir = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0]) tasks_file = os.path.join(jdir, 'tasks') time.sleep(2) ret = self.du.cat(self.hosts_list[0], tasks_file, sudo=True) tasks = ret['out'] if len(tasks) < 2: self.skipTest('pbs_cgroups_hook: only one task in cgroup') self.logger.info('Tasks: %s' % tasks) self.assertTrue(tasks, 'No tasks in cpuset cgroup for job') # Make dir in freezer subsystem under directory where we # have delegate control from systemd fdir_pbs = os.path.join(fdir, 'pbs_jobs.service', 'PtlPbs') if not self.du.isdir(self.hosts_list[0], fdir_pbs): self.du.mkdir(hostname=self.hosts_list[0], path=fdir_pbs, mode=0o755, sudo=True) # Write PIDs into the tasks file for the freezer cgroup # All except the top job process -- it remains thawed to # let the job exit 
task_file = os.path.join(fdir_pbs, 'tasks') success = True body = '' for pidstr in tasks: if pidstr.strip() == j.attributes['session_id']: self.logger.info('Skipping top job process ' + pidstr) else: cmd = ['echo ' + pidstr + ' >>' + task_file] ret = self.du.run_cmd(hosts=self.hosts_list[0], cmd=cmd, sudo=True, as_script=True) if ret['rc'] != 0: success = False self.logger.info('Failed to put %s into %s on %s' % (pidstr, task_file, self.hosts_list[0])) self.logger.info('rc = %d', ret['rc']) self.logger.info('stdout = %s', ret['out']) self.logger.info('stderr = %s', ret['err']) if not success: self.skipTest('pbs_cgroups_hook: Failed to copy freezer tasks') # Freeze the cgroup freezer_file = os.path.join(fdir_pbs, 'freezer.state') state = 'FROZEN' fn = self.du.create_temp_file(body=state) self.tempfile.append(fn) ret = self.du.run_copy(self.hosts_list[0], src=fn, dest=freezer_file, sudo=True, uid='root', gid='root', mode=0o644) if ret['rc'] != 0: self.skipTest('pbs_cgroups_hook: Failed to copy ' 'freezer state FROZEN') confirmed_frozen = False for count in range(30): ret = self.du.cat(hostname=self.hosts_list[0], filename=freezer_file, sudo=True) if ret['rc'] != 0: self.logger.info("Cannot confirm freezer state" "sleeping 30 seconds instead") time.sleep(30) break if ret['out'][0] == 'FROZEN': self.logger.info("job processes reported as FROZEN") confirmed_frozen = True break else: self.logger.info("freezer state reported as " + ret['out'][0]) time.sleep(1) if not confirmed_frozen: self.logger.info("Freezer did not work; skip test after cleanup") # Catch any exception so we can thaw the cgroup or the jobs # will remain frozen and impact subsequent tests passed = True # Now delete the job try: self.server.delete(id=jid) except Exception as exc: passed = False self.logger.info('Job could not be deleted') if confirmed_frozen: # The cgroup hook should fail to clean up the cgroups # because of the freeze, and offline node # Note that when vnode per numa node is enabled, 
this # will take longer: the execjob_epilogue will first mark # the per-socket vnode offline, but only the exechost_periodic # will mark the natural node offline try: self.server.expect(NODE, {'state': (MATCH_RE, 'offline')}, id=self.nodes_list[0], offset=10, interval=3) except Exception as exc: passed = False self.logger.info('Node never went offline') # Thaw the cgroup state = 'THAWED' fn = self.du.create_temp_file(body=state) self.tempfile.append(fn) ret = self.du.run_copy(self.hosts_list[0], src=fn, dest=freezer_file, sudo=True, uid='root', gid='root', mode=0o644) if ret['rc'] != 0: # Skip the test at the end when this happens, # but still attempt to clean up! confirmed_frozen = False # First confirm the processes were thawed for count in range(30): ret = self.du.cat(hostname=self.hosts_list[0], filename=freezer_file, sudo=True) if ret['rc'] != 0: self.logger.info("Cannot confirm freezer state" "sleeping 30 seconds instead") time.sleep(30) break if ret['out'][0] == 'THAWED': self.logger.info("job processes reported as THAWED") break else: self.logger.info("freezer state reported as " + ret['out'][0]) time.sleep(1) # once the freezer is thawed, all the processes should receive # the cgroup hook's kill signal and disappear; # confirm they're gone before deleting freezer freezer_tasks = os.path.join(fdir_pbs, 'tasks') for count in range(30): ret = self.du.cat(hostname=self.hosts_list[0], filename=freezer_tasks, sudo=True) if ret['rc'] != 0: self.logger.info("Cannot confirm freezer tasks" "sleeping 30 seconds instead") time.sleep(30) break if ret['out'] == [] or ret['out'][0] == '': self.logger.info("Processes in thawed freezer are gone") break else: self.logger.info("tasks still in thawed freezer: " + str(ret['out'])) time.sleep(1) cmd = ["rmdir", fdir_pbs] self.logger.info("Removing %s" % fdir_pbs) self.du.run_cmd(self.hosts_list[0], cmd=cmd, sudo=True) # Due to orphaned jobs node is not coming back to free state # workaround is to recreate the nodes. 
Orphaned jobs will # get cleaned up in tearDown hence not doing it here # try deleting the job once more, to ensure that the node isn't # busy try: self.server.delete(id=jid) except Exception as exc: pass bs = {'job_state': 'F'} self.server.expect(JOB, bs, jid, extend='x', offset=1) if not confirmed_frozen: self.cgroup_recreate_nodes() self.skipTest('Could not confirm freeze/thaw worked') return passed def cgroup_recreate_nodes(self): """ Since the job delete action was purposefully bent out of shape, node state might stay busy for some time retry until it works -- this is for the sanity of the next test """ for count in range(30): try: self.server.manager(MGR_CMD_DELETE, NODE, None, "") self.logger.info('Managed to delete nodes') break except Exception: self.logger.info('Failed to delete nodes (still busy?)') time.sleep(1) for host in self.hosts_list: try: self.server.manager(MGR_CMD_CREATE, NODE, id=host) except Exception: # the delete might have failed and then the create will, # but still confirm the node goes back to free state pass self.server.expect(NODE, {'state': 'free'}, id=host, interval=3) def test_cgroup_offline_node_preserve_comment(self): """ Test to verify that offlined node that is bring back online preserves custom comment. """ a = {'comment': "foo bar"} self.server.manager(MGR_CMD_SET, NODE, a, self.hosts_list[0]) name = 'CGROUP7.1' vn_per_numa = 'false' rv = self.cgroup_offline_node(name, vn_per_numa) self.assertTrue(rv) a = {'comment': "foo bar"} self.server.expect(NODE, a, id=self.hosts_list[0]) self.cgroup_recreate_nodes() def test_cgroup_offline_node(self): """ Test to verify that the node is offlined when it can't clean up the cgroup and brought back online once the cgroup is cleaned up. 
        vnode_per_numa_node = false
        """
        name = 'CGROUP7.1'
        vn_per_numa = 'false'
        rv = self.cgroup_offline_node(name, vn_per_numa)
        self.assertTrue(rv)
        self.cgroup_recreate_nodes()

    def test_cgroup_offline_node_vnpernuma(self):
        """
        Test to verify that the node is offlined when it can't clean up
        the cgroup and brought back online once the cgroup is cleaned up.
        vnode_per_numa_node = true
        """
        # vnode_per_numa_node needs hugepage info to size the vnodes
        with open(os.path.join(os.sep, 'proc', 'meminfo'), 'r') as fd:
            meminfo = fd.read()
        if 'Hugepagesize' not in meminfo:
            self.skipTest('Hugepagesize not in meminfo')
        name = 'CGROUP7.2'
        vn_per_numa = 'true'
        rv = self.cgroup_offline_node(name, vn_per_numa)
        self.assertTrue(rv)
        self.cgroup_recreate_nodes()

    @requirements(num_moms=2)
    def test_cgroup_cpuset_host_excluded(self):
        """
        Test to verify that cgroups subsystems are not enforced on nodes
        that have the exclude_hosts set but are enforced on other systems
        """
        name = 'CGROUP10'
        mom, _ = self.get_host_names(self.hosts_list[0])
        # cfg1 with momA placed in exclude_hosts for the cpuset subsystem
        self.load_config(self.cfg1 % ('', '', '', '%s' % mom,
                                      self.mem, self.swapctl))
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # sleep on either side so stime is safely between config load
        # and job submission for the log_match below
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        hostn = self.get_hostname(self.hosts_list[0])
        # momA must log the exclusion and create no cpuset job dir
        self.moms_list[0].log_match('cgroup excluded for subsystem cpuset '
                                    'on host %s' % hostn, starttime=stime,
                                    n='ALL')
        cpath = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        self.assertFalse(self.is_dir(cpath, self.hosts_list[0]))
        # Now try a job on momB
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[1], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid2 = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid2)
        # momB is not excluded, so the cpuset job dir must exist there
        cpath = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[1])
        self.logger.info('Checking for %s on %s' % (cpath,
                                                    self.moms_list[1]))
        self.assertTrue(self.is_dir(cpath, self.hosts_list[1]))

    @requirements(num_moms=2)
    def test_cgroup_run_on_host(self):
        """
        Test to verify that the cgroup hook only runs on nodes
        in the run_only_on_hosts
        """
        name = 'CGROUP11'
        mom, log = self.get_host_names(self.hosts_list[0])
        # cfg1 with only momA listed in run_only_on_hosts
        self.load_config(self.cfg1 % ('', '', '%s' % mom, '',
                                      self.mem, self.swapctl))
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[1], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # bracket stime with sleeps for a reliable log_match window
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # NOTE(review): 'hostn' is unused in this test
        hostn = self.get_hostname(self.hosts_list[1])
        # momB is not in run_only_on_hosts: hook disables itself there
        self.moms_list[1].log_match(
            'set enabled to False based on run_only_on_hosts',
            starttime=stime, n='ALL')
        cpath = self.get_cgroup_job_dir('memory', jid, self.hosts_list[1])
        self.assertFalse(self.is_dir(cpath, self.hosts_list[1]))
        # A job on momA (listed host) must get a memory cgroup
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid2 = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid2)
        self.server.status(JOB, ATTR_o, jid2)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        cpath = self.get_cgroup_job_dir('memory', jid2, self.hosts_list[0])
        self.assertTrue(self.is_dir(cpath, self.hosts_list[0]))

    def test_cgroup_qstat_resources(self):
        """
        Test to verify that cgroups are reporting usage for
        mem, and vmem in qstat
        """
        name = 'CGROUP14'
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        a = {'Resource_List.select': '1:ncpus=1:mem=500mb', ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.eatmem_job2)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # NOTE(review): 'host' is unused in this test
        host = j.attributes['exec_host']
        self.logger.info('OUTPUT: %s' % o)
        resc_list = ['resources_used.cput']
        resc_list += ['resources_used.mem']
        resc_list += ['resources_used.vmem']
        # First snapshot of usage as reported to the server
        qstat1 = self.server.status(JOB, resc_list, id=jid)
        for q in qstat1:
            self.logger.info('Q1: %s' % q)
        cput1 = qstat1[0]['resources_used.cput']
        mem1 = qstat1[0]['resources_used.mem']
        vmem1 = qstat1[0]['resources_used.vmem']
        self.logger.info('Waiting 35 seconds for CPU time to accumulate')
        time.sleep(35)
        # Second snapshot; usage must have moved if the hook polls
        qstat2 = self.server.status(JOB, resc_list, id=jid)
        for q in qstat2:
            self.logger.info('Q2: %s' % q)
        cput2 = qstat2[0]['resources_used.cput']
        mem2 = qstat2[0]['resources_used.mem']
        vmem2 = qstat2[0]['resources_used.vmem']
        self.assertNotEqual(cput1, cput2)
        self.assertNotEqual(mem1, mem2)
        # Check vmem only if system has swap control
        if self.swapctl == 'true':
            self.assertNotEqual(vmem1, vmem2)

    def test_cgroup_reserve_mem(self):
        """
        Test to verify that the mom reserve memory for OS
        when there is a reserve mem request in the config.
        Install cfg3 and then cfg4 and measure difference between
        the amount of available memory and memsw.
        For example, on a system with 1GB of physical memory and
        1GB of active swap. With cfg3 in place, we should see
        1GB - 50MB = 950MB of available memory and
        2GB - (50MB + 45MB) = 1905MB of available vmem.
        With cfg4 in place, we should see
        1GB - 100MB = 900MB of available memory and
        2GB - (100MB + 90MB) = 1810MB of available vmem.
        When we calculate the differences we get:
        mem: 950MB - 900MB = 50MB = 51200KB
        vmem: 1905MB - 1810MB = 95MB = 97280KB
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        self.load_config(self.cfg3 % ('', 'false', '', self.mem, '',
                                      self.swapctl, ''))
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0],
                           interval=3, offset=10)
        # Baseline available vmem/mem under cfg3 (smaller reserve)
        if self.swapctl == 'true':
            vmem = self.server.status(NODE, 'resources_available.vmem',
                                      id=self.nodes_list[0])
            self.logger.info('vmem: %s' % str(vmem))
            vmem1 = PbsTypeSize(vmem[0]['resources_available.vmem'])
            self.logger.info('Vmem-1: %s' % vmem1.value)
        mem = self.server.status(NODE, 'resources_available.mem',
                                 id=self.nodes_list[0])
        mem1 = PbsTypeSize(mem[0]['resources_available.mem'])
        self.logger.info('Mem-1: %s' % mem1.value)
        # Switch to cfg4 (larger reserve) and measure again
        self.load_config(self.cfg4 % (self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0],
                           interval=3, offset=10)
        if self.swapctl == 'true':
            vmem = self.server.status(NODE, 'resources_available.vmem',
                                      id=self.nodes_list[0])
            vmem2 = PbsTypeSize(vmem[0]['resources_available.vmem'])
            self.logger.info('Vmem-2: %s' % vmem2.value)
            vmem_resv = vmem1 - vmem2
            # normalize the PbsTypeSize difference to bytes
            if (vmem_resv.unit == 'b'):
                vmem_resv_bytes = vmem_resv.value
            elif (vmem_resv.unit == 'kb'):
                vmem_resv_bytes = vmem_resv.value * 1024
            elif (vmem_resv.unit == 'mb'):
                vmem_resv_bytes = vmem_resv.value * 1024 * 1024
            self.logger.info('Vmem resv diff in bytes: %s'
                             % vmem_resv_bytes)
            # rounding differences may make diff slighly smaller than we
            # expect
            # accept 1MB deviation as irrelevant
            # Note: since we don't know if there is swap, memsw reserved
            # increase might not have been heeded. Change this to a higher
            # value (cfr. above) only on test harnesses that have enough
            # swap
            self.assertGreaterEqual(vmem_resv_bytes, (51200 - 1024) * 1024)
        mem = self.server.status(NODE, 'resources_available.mem',
                                 id=self.nodes_list[0])
        mem2 = PbsTypeSize(mem[0]['resources_available.mem'])
        self.logger.info('Mem-2: %s' % mem2.value)
        mem_resv = mem1 - mem2
        # normalize the PbsTypeSize difference to bytes
        if (mem_resv.unit == 'b'):
            mem_resv_bytes = mem_resv.value
        elif (mem_resv.unit == 'kb'):
            mem_resv_bytes = mem_resv.value * 1024
        elif (mem_resv.unit == 'mb'):
            mem_resv_bytes = mem_resv.value * 1024 * 1024
        self.logger.info('Mem resv diff in bytes: %s' % mem_resv_bytes)
        # rounding differences may make diff slighly smaller than we expect
        # accept 1MB deviation as irrelevant
        self.assertGreaterEqual(mem_resv_bytes, (51200 - 1024) * 1024)

    @requirements(num_moms=2)
    def test_cgroup_multi_node(self):
        """
        Test multi-node jobs with cgroups

        A scatter-placed two-chunk job must get a memory cgroup on each
        execution host, and both must be removed when the job ends.
        """
        name = 'CGROUP16'
        self.load_config(self.cfg6 % (self.mem, self.swapctl))
        a = {'Resource_List.select': '2:ncpus=1:mem=100mb',
             'Resource_List.place': 'scatter', ATTR_N: name}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep30_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, 'exec_host', jid)
        ehost = j.attributes['exec_host']
        # exec_host looks like hostA/idx+hostB/idx; keep host names only
        tmp_host = ehost.split('+')
        ehost1 = tmp_host[0].split('/')[0]
        ehjd1 = self.get_cgroup_job_dir('memory', jid, ehost1)
        self.assertTrue(self.is_dir(ehjd1, ehost1),
                        'Missing memory subdirectory: %s' % ehjd1)
        ehost2 = tmp_host[1].split('/')[0]
        ehjd2 = self.get_cgroup_job_dir('memory', jid, ehost2)
        self.assertTrue(self.is_dir(ehjd2, ehost2),
                        'Missing memory subdirectory: %s' % ehjd2)
        # Wait for job to finish and make sure that cgroup directories
        # has been cleaned up by the hook
        self.server.expect(JOB, 'queue', op=UNSET, offset=30, interval=1,
                           id=jid)
        self.assertFalse(self.is_dir(ehjd1, ehost1),
                         'Directory still present: %s' % ehjd1)
        self.assertFalse(self.is_dir(ehjd2, ehost2),
                         'Directory still present: %s' % ehjd2)

    def test_cgroup_job_array(self):
        """
        Test that cgroups are created for subjobs like a regular job
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        name = 'CGROUP17'
        self.load_config(self.cfg1 % ('', '', '', '',
                                      self.mem, self.swapctl))
        # pack:excl so only one subjob runs at a time and subjob 4 queues
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name, ATTR_J: '1-4',
             'Resource_List.place': 'pack:excl'}
        j = Job(TEST_USER, attrs=a)
        j.set_sleep_time(60)
        jid = self.server.submit(j)
        a = {'job_state': 'B'}
        self.server.expect(JOB, a, jid)
        # Get subjob ID
        subj1 = jid.replace('[]', '[1]')
        self.server.expect(JOB, {'job_state': 'R'}, subj1)
        rv = self.server.status(JOB, ['exec_host'], subj1)
        ehost = rv[0].get('exec_host')
        ehost1 = ehost.split('/')[0]
        # Verify that cgroups files created for subjobs
        # but not for parent job array
        cpath = self.get_cgroup_job_dir('memory', subj1, ehost1)
        self.assertTrue(self.is_dir(cpath, ehost1))
        cpath = self.get_cgroup_job_dir('memory', jid, ehost1)
        self.assertFalse(self.is_dir(cpath, ehost1))
        # Verify that subjob4 is queued and no cgroups
        # files are created for queued subjob
        subj4 = jid.replace('[]', '[4]')
        self.server.expect(JOB, {'job_state': 'Q'}, id=subj4)
        cpath = self.get_cgroup_job_dir('memory', subj4, ehost1)
        self.assertFalse(self.is_dir(cpath, self.hosts_list[0]))
        # Delete subjob1 and verify that cgroups files are cleaned up
        self.server.delete(id=subj1)
        self.server.expect(JOB, {'job_state': 'X'}, subj1)
        cpath = self.get_cgroup_job_dir('memory', subj1, ehost1)
        self.assertFalse(self.is_dir(cpath, ehost1))
        # Verify if subjob2 is running
        subj2 = jid.replace('[]', '[2]')
        self.server.expect(JOB, {'job_state': 'R'}, id=subj2)
        # Force delete the subjob and verify cgroups
        # files are cleaned up
        self.server.delete(id=subj2, extend='force')
        self.server.expect(JOB, {'job_state': 'X'}, subj2)
        # Adding extra sleep for file to clean up
        # since qdel -Wforce changed state of subjob
        # without waiting for MoM
        # retry 10 times (for 20 seconds max. in total)
        # if the directory is still there...
        cpath = self.get_cgroup_job_dir('memory', subj2, ehost1)
        for trial in range(0, 10):
            time.sleep(2)
            if not self.is_dir(cpath, ehost1):
                # we're done
                break
        self.assertFalse(self.is_dir(cpath, ehost1))

    @requirements(num_moms=2)
    def test_cgroup_cleanup(self):
        """
        Test that cgroups files are cleaned up after qdel
        """
        self.load_config(self.cfg1 % ('', '', '', '',
                                      self.mem, self.swapctl))
        a = {'Resource_List.select': '2:ncpus=1:mem=100mb',
             'Resource_List.place': 'scatter'}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ['exec_host'], jid)
        ehost = j.attributes['exec_host']
        # split exec_host into the two execution host names
        tmp_host = ehost.split('+')
        ehost1 = tmp_host[0].split('/')[0]
        ehost2 = tmp_host[1].split('/')[0]
        ehjd1 = self.get_cgroup_job_dir('cpuset', jid, ehost1)
        self.assertTrue(self.is_dir(ehjd1, ehost1))
        ehjd2 = self.get_cgroup_job_dir('cpuset', jid, ehost2)
        self.assertTrue(self.is_dir(ehjd2, ehost2))
        # qdel with wait=True: directories must be gone once job is out
        self.server.delete(id=jid, wait=True)
        self.assertFalse(self.is_dir(ehjd1, ehost1))
        self.assertFalse(self.is_dir(ehjd2, ehost2))

    def test_cgroup_execjob_end_should_delete_cgroup(self):
        """
        Test to verify that if execjob_epilogue hook failed to run or to
        clean up cgroup files for a job, execjob_end hook should clean
        them up
        """
        self.load_config(self.cfg4 % (self.mem, self.swapctl))
        # remove epilogue and periodic from the list of events
        attr = {'enabled': 'True',
                'event': ['execjob_begin', 'execjob_launch',
                          'execjob_attach', 'execjob_end',
                          'exechost_startup']}
        self.server.manager(MGR_CMD_SET, HOOK, attr, self.hook_name)
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0])
        j = Job(TEST_USER)
        j.set_sleep_time(1)
        jid = self.server.submit(j)
        # wait for job to finish
        self.server.expect(JOB, 'queue', id=jid, op=UNSET, interval=1,
                           offset=1)
        # verify that cgroup files for this job are gone even if
        # epilogue and
periodic events are disabled for subsys, path in self.paths[self.hosts_list[0]].items(): # only check under subsystems that are enabled enabled_subsys = ['cpuacct', 'cpuset', 'memory', 'memsw'] if (any([x in subsys for x in enabled_subsys])): continue if path: # Following code only works with recent hooks # and default cgroup_prefix # change the path if testing with older hooks # see comments in get_cgroup_job_dir() filename = os.path.join(path, 'pbs_jobs.service', 'jobid', str(jid)) self.logger.info('Checking that file %s should not exist' % filename) self.assertFalse(self.du.isfile(self.hosts_list[0], filename)) @skipOnCray def test_cgroup_assign_resources_mem_only_vnode(self): """ Test to verify that job requesting mem larger than any single vnode works properly """ if not self.paths[self.hosts_list[0]]['memory']: self.skipTest('Test requires memory subystem mounted') # vnode_per_numa_node enabled, so we get per-socket vnodes self.load_config(self.cfg3 % ('', 'true', '', self.mem, '', self.swapctl, '')) self.server.expect(NODE, {ATTR_NODE_state: 'free'}, id=self.hosts_list[0]+'[0]') socket1_found = False nodestat = self.server.status(NODE) total_kb = 0 for node in nodestat: if (self.mom.shortname + '[') not in node['id']: self.logger.info('Skipping vnode %s' % node['id']) else: if node['id'] == self.mom.shortname + '[0]': self.logger.info('Found socket 0, vnode %s' % node['id']) if node['id'] == self.mom.shortname + '[1]': socket1_found = True self.logger.info('Found socket 1, vnode %s ' '(multi socket!)' % node['id']) # PbsTypeSize value is in kb node_kb = PbsTypeSize(node['resources_available.mem']).value self.logger.info('Vnode %s memory: %skb' % (node['id'], node_kb)) total_kb += node_kb total_mb = int(total_kb / 1024) self.logger.info("Total memory on first MoM: %smb" % total_mb) if not socket1_found: self.skipTest('Test requires more than one NUMA node ' '(i.e. 
"socket") on first host') memreq_mb = total_mb - 2 a = {'Resource_List.select': '1:ncpus=1:host=%s:mem=%smb' % (self.mom.shortname, str(memreq_mb))} j1 = Job(TEST_USER, attrs=a) j1.create_script('date') jid1 = self.server.submit(j1) # Job should finish and thus dequeued self.server.expect(JOB, 'queue', id=jid1, op=UNSET, interval=1, offset=1) a = {'Resource_List.select': '1:ncpus=1:host=%s:mem=%smb' % (self.mom.shortname, str(memreq_mb + 1024))} j3 = Job(TEST_USER, attrs=a) j3.create_script('date') jid3 = self.server.submit(j3) # Will either start with "Can Never Run" or "Not Running" # Don't match only one a = {'job_state': 'Q', 'comment': (MATCH_RE, '.*: Insufficient amount of resource: mem.*')} self.server.expect(JOB, a, attrop=PTL_AND, id=jid3, offset=10, interval=1) @timeout(1800) def test_cgroup_cpuset_exclude_cpu(self): """ Confirm that exclude_cpus reduces resources_available.ncpus """ # Fetch the unmodified value of resources_available.ncpus self.load_config(self.cfg5 % ('false', '', 'false', 'false', 'false', self.mem, self.swapctl)) self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0], interval=1) result = self.server.status(NODE, 'resources_available.ncpus', id=self.nodes_list[0]) orig_ncpus = int(result[0]['resources_available.ncpus']) self.assertGreater(orig_ncpus, 0) self.logger.info('Original value of ncpus: %d' % orig_ncpus) if orig_ncpus < 2: self.skipTest('Node must have at least two CPUs') # Now exclude CPU zero self.load_config(self.cfg5 % ('false', '0', 'false', 'false', 'false', self.mem, self.swapctl)) self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0], interval=1) result = self.server.status(NODE, 'resources_available.ncpus', id=self.nodes_list[0]) new_ncpus = int(result[0]['resources_available.ncpus']) self.assertGreater(new_ncpus, 0) self.logger.info('New value with one CPU excluded: %d' % new_ncpus) self.assertEqual((new_ncpus + 1), orig_ncpus) # Repeat the process with vnode_per_numa_node set to true vnode = 
        '%s[0]' % self.nodes_list[0]
        self.load_config(self.cfg5 % ('true', '', 'false', 'false',
                                      'false', self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=vnode, interval=1)
        result = self.server.status(NODE, 'resources_available.ncpus',
                                    id=vnode)
        orig_ncpus = int(result[0]['resources_available.ncpus'])
        self.assertGreater(orig_ncpus, 0)
        self.logger.info('Original value of vnode ncpus: %d' % orig_ncpus)
        # Exclude CPU zero again
        self.load_config(self.cfg5 % ('true', '0', 'false', 'false',
                                      'false', self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=vnode, interval=1)
        result = self.server.status(NODE, 'resources_available.ncpus',
                                    id=vnode)
        new_ncpus = int(result[0]['resources_available.ncpus'])
        # vnode [0] must also lose exactly one CPU
        self.assertEqual((new_ncpus + 1), orig_ncpus)

    def test_cgroup_cpuset_mem_fences(self):
        """
        Confirm that mem_fences affects setting of cpuset.mems
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        # Get the grandparent directory
        cpuset_base = self.paths[self.hosts_list[0]]['cpuset']
        cpuset_mems = os.path.join(cpuset_base, 'cpuset.mems')
        result = self.du.cat(hostname=self.hosts_list[0],
                             filename=cpuset_mems, sudo=True)
        # a root cpuset.mems of just '0' means single NUMA node
        if result['rc'] != 0 or result['out'][0] == '0':
            self.skipTest('Test requires two NUMA nodes')
        # First try with mem_fences set to true (the default)
        self.load_config(self.cfg5 % ('false', '', 'true', 'false',
                                      'false', self.mem, self.swapctl))
        # Do not use node_list -- vnode_per_numa_node is NOW off
        # so use the natural node. Otherwise might 'expect' stale vnode
        self.server.expect(NODE, {'state': 'free'}, id=self.hosts_list[0],
                           interval=3, offset=10)
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        # Read the job's cpuset.mems under the fenced configuration
        fn = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        fn = os.path.join(fn, 'cpuset.mems')
        result = self.du.cat(hostname=self.hosts_list[0], filename=fn,
                             sudo=True)
        self.assertEqual(result['rc'], 0)
        value_mem_fences = result['out'][0]
        self.logger.info("value with mem_fences: %s" % value_mem_fences)
        self.server.delete(jid, wait=True)
        # Now try with mem_fences set to false
        self.load_config(self.cfg5 % ('false', '', 'false', 'false',
                                      'false', self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0],
                           interval=3, offset=10)
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        fn = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        fn = os.path.join(fn, 'cpuset.mems')
        result = self.du.cat(hostname=self.hosts_list[0], filename=fn,
                             sudo=True)
        self.assertEqual(result['rc'], 0)
        # compare mem value under mem_fences and under no mem_fences
        value_no_mem_fences = result['out'][0]
        self.logger.info("value with no mem_fences:%s"
                         % value_no_mem_fences)
        self.assertNotEqual(value_no_mem_fences, value_mem_fences)

    def test_cgroup_cpuset_mem_hardwall(self):
        """
        Confirm that mem_hardwall affects setting of
        cpuset.mem_hardwall
        """
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        # First run with mem_hardwall disabled in the config
        self.load_config(self.cfg5 % ('false', '', 'true', 'false',
                                      'false', self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0],
                           interval=3, offset=10)
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        memh_path = 'cpuset.mem_hardwall'
        fn = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        # cgroup mounted with 'noprefix' drops the 'cpuset.' prefix
        if self.noprefix:
            memh_path = 'mem_hardwall'
        fn = os.path.join(fn, memh_path)
        self.logger.info('fn is %s' % fn)
        if not (self.is_file(fn, self.hosts_list[0])):
            self.skipTest('cgroup mem_hardwall of job does not exist')
        result = self.du.cat(hostname=self.hosts_list[0], filename=fn,
                             sudo=True)
        self.assertEqual(result['rc'], 0)
        # hardwall disabled -> kernel file must read '0'
        self.assertEqual(result['out'][0], '0')
        self.server.delete(jid, wait=True)
        # Now run again with mem_hardwall enabled
        self.load_config(self.cfg5 % ('false', '', 'true', 'true',
                                      'false', self.mem, self.swapctl))
        self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0],
                           interval=3, offset=10)
        a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' %
             self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, ATTR_o, jid)
        o = j.attributes[ATTR_o]
        self.tempfile.append(o)
        fn = self.get_cgroup_job_dir('cpuset', jid, self.hosts_list[0])
        fn = os.path.join(fn, memh_path)
        if not (self.is_file(fn, self.hosts_list[0])):
            self.skipTest('cgroup mem_hardwall of job does not exist')
        result = self.du.cat(hostname=self.hosts_list[0], filename=fn,
                             sudo=True)
        self.assertEqual(result['rc'], 0)
        # hardwall enabled -> kernel file must read '1'
        self.assertEqual(result['out'][0], '1')

    def test_cgroup_find_gpus(self):
        """
        Confirm that the hook finds the correct number of GPUs.
Note: This assumes all GPUs have the same MIG configuration, either on or off. """ if not self.paths[self.hosts_list[0]]['devices']: self.skipTest('Skipping test since no devices subsystem defined') name = 'CGROUP3' self.load_config(self.cfg2) cmd = ['nvidia-smi', '-L'] try: rv = self.du.run_cmd(hosts=self.moms_list[0].hostname, cmd=cmd) except OSError: rv = {'err': True} if rv['err'] or 'GPU' not in rv['out'][0]: self.skipTest('Skipping test since nvidia-smi not found') last_gpu_was_physical = False gpus = 0 # store uuids of the MIG devices uuid_list = [] for l in rv['out']: if l.startswith('GPU'): last_gpu_was_physical = True gpus += 1 elif l.lstrip().startswith('MIG'): uuid_list.append(l.split()[-1].rstrip(")")) if last_gpu_was_physical: gpus -= 1 last_gpu_was_physical = False gpus += 1 if gpus < 1: self.skipTest('Skipping test since no gpus found on %s' % (self.nodes_list[0])) ngpus_stat = self.server.status(NODE, id=self.nodes_list[0])[0] self.logger.info("pbsnodes for %s reported: %s" % (self.nodes_list[0], ngpus_stat)) self.assertTrue('resources_available.ngpus' in ngpus_stat, "No resources_available.ngpus found on node %s" % (self.nodes_list[0])) ngpus = int(ngpus_stat['resources_available.ngpus']) self.assertEqual(gpus, ngpus, 'ngpus is incorrect') a = {'Resource_List.select': '1:ngpus=1', ATTR_N: name} j = Job(TEST_USER, attrs=a) j.create_script(self.check_gpu_script) jid = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R'}, jid) self.server.status(JOB, [ATTR_o, 'exec_host'], jid) filename = j.attributes[ATTR_o] self.tempfile.append(filename) ehost = j.attributes['exec_host'] tmp_file = filename.split(':')[1] tmp_host = ehost.split('/')[0] tmp_out = self.wait_and_read_file(filename=tmp_file, host=tmp_host) mig_devices_in_use = tmp_out[-1] for mig_device in mig_devices_in_use.split(","): self.assertIn(mig_device, uuid_list, "MIG identifiers do not match") self.logger.info(tmp_out) self.assertIn('There are 1 GPUs', tmp_out, 'No gpus were 
assigned') self.assertIn('c 195:255 rwm', tmp_out, 'Nvidia controller not found') m = re.search(r'195:(?!255)', '\n'.join(tmp_out)) self.assertIsNotNone(m.group(0), 'No gpu assigned in cgroups') def test_cgroup_cpuset_memory_spread_page(self): """ Confirm that mem_spread_page affects setting of cpuset.memory_spread_page """ if not self.paths[self.hosts_list[0]]['memory']: self.skipTest('Test requires memory subystem mounted') self.load_config(self.cfg5 % ('false', '', 'true', 'false', 'false', self.mem, self.swapctl)) nid = self.nodes_list[0] self.server.expect(NODE, {'state': 'free'}, id=nid, interval=3, offset=10) hostn = self.hosts_list[0] a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' % hostn} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) self.server.status(JOB, ATTR_o, jid) o = j.attributes[ATTR_o] self.tempfile.append(o) spread_path = 'cpuset.memory_spread_page' fn = self.get_cgroup_job_dir('cpuset', jid, hostn) if self.noprefix: spread_path = 'memory_spread_page' fn = os.path.join(fn, spread_path) self.assertTrue(self.is_file(fn, hostn)) result = self.du.cat(hostname=hostn, filename=fn, sudo=True) self.assertEqual(result['rc'], 0) self.assertEqual(result['out'][0], '0') self.server.delete(jid, wait=True) self.load_config(self.cfg5 % ('false', '', 'true', 'false', 'true', self.mem, self.swapctl)) self.server.expect(NODE, {'state': 'free'}, id=nid, interval=3, offset=10) a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' % hostn} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) self.server.status(JOB, ATTR_o, jid) o = j.attributes[ATTR_o] self.tempfile.append(o) fn = self.get_cgroup_job_dir('cpuset', jid, hostn) fn = os.path.join(fn, spread_path) result = self.du.cat(hostname=hostn, filename=fn, sudo=True) self.assertEqual(result['rc'], 0) 
self.assertEqual(result['out'][0], '1') def test_cgroup_use_hierarchy(self): """ Test that memory.use_hierarchy is enabled by default when PBS cgroups hook is instantiated """ # Remove PBS directories from memory subsystem cpath = None if ('memory' in self.paths[self.hosts_list[0]] and self.paths[self.hosts_list[0]]['memory']): cdir = self.paths[self.hosts_list[0]]['memory'] cpath = self.find_main_cpath(cdir) else: self.skipTest( "memory subsystem is not enabled for cgroups") if cpath is not None: cmd = ["rmdir", cpath] self.du.run_cmd(cmd=cmd, sudo=True, hosts=self.hosts_list[0]) self.logger.info("Removing %s" % cpath) self.load_config(self.cfg6 % (self.mem, self.swapctl)) # check where cpath is once more # since we loaded a new cgroup config file cpath = None if ('memory' in self.paths[self.hosts_list[0]] and self.paths[self.hosts_list[0]]['memory']): cdir = self.paths[self.hosts_list[0]]['memory'] cpath = self.find_main_cpath(cdir) # Verify that memory.use_hierarchy is enabled fpath = os.path.join(cpath, "memory.use_hierarchy") self.logger.info("looking for file %s" % fpath) rc = self.du.isfile(hostname=self.hosts_list[0], path=fpath) if rc: ret = self.du.cat(hostname=self.hosts_list[0], filename=fpath, logerr=False) val = (' '.join(ret['out'])).strip() self.assertEqual( val, "1", "%s is not equal to 1" % val) self.logger.info("memory.use_hierarchy is enabled") else: self.assertFalse(1, "File %s not present" % fpath) def test_cgroup_periodic_update_known_jobs(self): """ Verify that jobs known to mom are updated, not orphans """ conf = {'freq': 5, 'order': 100} self.server.manager(MGR_CMD_SET, HOOK, conf, self.hook_name) self.load_config(self.cfg3 % ('', 'false', '', self.mem, '', self.swapctl, '')) # Submit a short job and let it run to completion a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' % self.hosts_list[0]} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep5_job) time.sleep(2) stime = int(time.time()) time.sleep(2) jid1 = 
self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid1) self.server.status(JOB, ATTR_o, jid1) o = j.attributes[ATTR_o] self.tempfile.append(o) err_msg = "Unexpected error in pbs_cgroups " + \ "handling exechost_periodic event: TypeError" self.moms_list[0].log_match(err_msg, max_attempts=3, interval=1, n='ALL', starttime=stime, existence=False) self.server.log_match(jid1 + ';Exit_status=0', n='ALL', starttime=stime) # Create a periodic hook that runs more frequently than the # cgroup hook to prepend jid1 to mom_priv/hooks/hook_data/cgroup_jobs hookname = 'prependjob' hookbody = """ import pbs import os import re import time import traceback event = pbs.event() jid_to_prepend = '%s' pbs_home = '' pbs_mom_home = '' if 'PBS_HOME' in os.environ: pbs_home = os.environ['PBS_HOME'] if 'PBS_MOM_HOME' in os.environ: pbs_mom_home = os.environ['PBS_MOM_HOME'] pbs_conf = pbs.get_pbs_conf() if pbs_conf: if not pbs_home and 'PBS_HOME' in pbs_conf: pbs_home = pbs_conf['PBS_HOME'] if not pbs_mom_home and 'PBS_MOM_HOME' in pbs_conf: pbs_mom_home = pbs_conf['PBS_MOM_HOME'] if not pbs_home or not pbs_mom_home: if 'PBS_CONF_FILE' in os.environ: pbs_conf_file = os.environ['PBS_CONF_FILE'] else: pbs_conf_file = os.path.join(os.sep, 'etc', 'pbs.conf') regex = re.compile(r'\\s*([^\\s]+)\\s*=\\s*([^\\s]+)\\s*') try: with open(pbs_conf_file, 'r') as desc: for line in desc: match = regex.match(line) if match: if not pbs_home and match.group(1) == 'PBS_HOME': pbs_home = match.group(2) if not pbs_mom_home and (match.group(1) == 'PBS_MOM_HOME'): pbs_mom_home = match.group(2) except Exception: pass if not pbs_home: pbs.logmsg(pbs.EVENT_DEBUG, 'Failed to locate PBS_HOME') event.reject() if not pbs_mom_home: pbs_mom_home = pbs_home jobsfile = os.path.join(pbs_mom_home, 'mom_priv', 'hooks', 'hook_data', 'cgroup_jobs') try: with open(jobsfile, 'r+') as desc: jobdict = eval(desc.read()) if jid_to_prepend not in jobdict: jobdict[jid_to_prepend] = time.time() desc.seek(0) 
desc.write(str(jobdict)) desc.truncate() except Exception as exc: pbs.logmsg(pbs.EVENT_DEBUG, 'Failed to modify ' + jobsfile) pbs.logmsg(pbs.EVENT_DEBUG, str(traceback.format_exc().strip().splitlines())) event.reject() event.accept() """ % jid1 events = ['execjob_begin', 'exechost_periodic'] hookconf = {'enabled': 'True', 'freq': 2, 'alarm': 30, 'event': events} self.server.create_import_hook(hookname, hookconf, hookbody, overwrite=True) # Submit a second job and verify that the following message # does NOT appear in the mom log: # _exechost_periodic_handler: Failed to update jid1 a = {'Resource_List.select': '1:ncpus=1:mem=100mb:host=%s' % self.hosts_list[0]} j = Job(TEST_USER, attrs=a) # Here a short job is OK, since we are waiting for it to end j.create_script(self.sleep30_job) time.sleep(2) presubmit = int(time.time()) time.sleep(2) jid2 = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid2) self.server.status(JOB, ATTR_o, jid2) o = j.attributes[ATTR_o] self.tempfile.append(o) err_msg = "Unexpected error in pbs_cgroups " + \ "handling exechost_periodic event: TypeError" self.moms_list[0].log_match(err_msg, max_attempts=3, interval=1, n='ALL', starttime=presubmit, existence=False) self.server.log_match(jid2 + ';Exit_status=0', n='ALL', starttime=presubmit) self.server.manager(MGR_CMD_DELETE, HOOK, None, hookname) command = ['rm', '-rf', os.path.join(self.moms_list[0].pbs_conf['PBS_HOME'], 'mom_priv', 'hooks', 'hook_data', 'cgroup_jobs')] self.du.run_cmd(cmd=command, hosts=self.hosts_list[0], sudo=True) logmsg = '_exechost_periodic_handler: Failed to update %s' % jid1 self.moms_list[0].log_match(msg=logmsg, starttime=presubmit, n='ALL', max_attempts=1, existence=False) @requirements(num_moms=3) def test_cgroup_release_nodes(self): """ Verify that exec_vnode values are trimmed when execjob_launch hook prunes job via release_nodes(), tolerate_node_failures=job_start """ self.load_config(self.cfg7 % (self.mem, self.mem)) # instantiate 
queuejob hook hook_event = 'queuejob' hook_name = 'qjob' a = {'event': hook_event, 'enabled': 'true'} self.server.create_import_hook(hook_name, a, self.qjob_hook_body) # instantiate execjob_launch hook hook_event = 'execjob_launch' hook_name = 'launch' a = {'event': hook_event, 'enabled': 'true'} self.keep_select = 'e.job.Resource_List["site"]' self.server.create_import_hook( hook_name, a, self.launch_hook_body % (self.keep_select)) # Submit a job that requires 2 nodes j = Job(TEST_USER) j.create_script(self.job_scr2 % (self.hosts_list[1])) jid = self.server.submit(j) # Check the exec_vnode while in substate 41 self.server.expect(JOB, {ATTR_substate: '41'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode1 = job_stat[0]['exec_vnode'] self.logger.info("initial exec_vnode: %s" % execvnode1) initial_vnodes = execvnode1.split('+') # Check the exec_vnode after job is in substate 42 self.server.expect(JOB, {ATTR_substate: '42'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode2 = job_stat[0]['exec_vnode'] self.logger.info("pruned exec_vnode: %s" % execvnode2) pruned_vnodes = execvnode2.split('+') # Check that the pruned exec_vnode has one less than initial value self.assertEqual(len(pruned_vnodes) + 1, len(initial_vnodes)) # Find the released vnode for vn in initial_vnodes: if vn not in pruned_vnodes: rel_vn = vn vnodeB = rel_vn.split(':')[0].split('(')[1] self.logger.info("released vnode: %s" % vnodeB) # Submit a second job requesting the released vnode, job runs j2 = Job(TEST_USER, {ATTR_l + '.select': '1:ncpus=1:mem=100mb:vnode=%s' % vnodeB}) jid2 = self.server.submit(j2) self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2) @requirements(num_moms=3) def test_cgroup_sismom_resize_fail(self): """ Verify that exec_vnode values are trimmed when execjob_launch hook prunes job via release_nodes(), exec_job_resize failure in sister mom, 
tolerate_node_failures=job_start """ self.load_config(self.cfg7 % (self.mem, self.mem)) # instantiate queuejob hook hook_event = 'queuejob' hook_name = 'qjob' a = {'event': hook_event, 'enabled': 'true'} self.server.create_import_hook(hook_name, a, self.qjob_hook_body) # instantiate execjob_launch hook hook_event = 'execjob_launch' hook_name = 'launch' a = {'event': hook_event, 'enabled': 'true'} self.keep_select = 'e.job.Resource_List["site"]' self.server.create_import_hook( hook_name, a, self.launch_hook_body % (self.keep_select)) # instantiate execjob_resize hook hook_event = 'execjob_resize' hook_name = 'resize' a = {'event': hook_event, 'enabled': 'true'} self.server.create_import_hook( hook_name, a, self.resize_hook_body % ('not')) # Submit a job that requires 2 nodes j = Job(TEST_USER) # Note mother superior is mom[1] not mom[0] j.create_script(self.job_scr2 % (self.hosts_list[1])) time.sleep(2) stime = int(time.time()) time.sleep(2) jid = self.server.submit(j) # Check the exec_vnode while in substate 41 self.server.expect(JOB, {ATTR_substate: '41'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode1 = job_stat[0]['exec_vnode'] self.logger.info("initial exec_vnode: %s" % execvnode1) # Check the exec_resize hook reject message in sister mom logs self.moms_list[0].log_match( "Job;%s;Cannot resize the job" % (jid), starttime=stime, interval=2, n='ALL') # Check that MS saw that the sister mom failed to update the job # This message is on MS mom[1] but mentions sismom mom[0] self.moms_list[1].log_match( "Job;%s;sister node %s.* failed to update job" % (jid, self.hosts_list[0]), starttime=stime, interval=2, regexp=True, n='ALL') # Because of resize hook reject Mom failed to update the job. # Check that job got requeued. 
self.server.log_match("Job;%s;Job requeued" % (jid), starttime=stime, n='ALL') @requirements(num_moms=3) def test_cgroup_msmom_resize_fail(self): """ Verify that exec_vnode values are trimmed when execjob_launch hook prunes job via release_nodes(), exec_job_resize failure in mom superior, tolerate_node_failures=job_start """ self.load_config(self.cfg7 % (self.mem, self.mem)) # instantiate queuejob hook hook_event = 'queuejob' hook_name = 'qjob' a = {'event': hook_event, 'enabled': 'true'} self.server.create_import_hook(hook_name, a, self.qjob_hook_body) # instantiate execjob_launch hook hook_event = 'execjob_launch' hook_name = 'launch' a = {'event': hook_event, 'enabled': 'true'} self.keep_select = 'e.job.Resource_List["site"]' self.server.create_import_hook( hook_name, a, self.launch_hook_body % (self.keep_select)) # instantiate execjob_resize hook hook_event = 'execjob_resize' hook_name = 'resize' a = {'event': hook_event, 'enabled': 'true'} self.server.create_import_hook( hook_name, a, self.resize_hook_body % ('')) # Submit a job that requires 2 nodes j = Job(TEST_USER) j.create_script(self.job_scr2 % (self.hosts_list[1])) time.sleep(2) stime = int(time.time()) time.sleep(2) jid = self.server.submit(j) # Check the exec_vnode while in substate 41 self.server.expect(JOB, {ATTR_substate: '41'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode1 = job_stat[0]['exec_vnode'] self.logger.info("initial exec_vnode: %s" % execvnode1) # Check the exec_resize hook reject message in MS log self.moms_list[1].log_match( "Job;%s;Cannot resize the job" % (jid), starttime=stime, interval=2, n='ALL') # Because of resize hook reject Mom failed to update the job. 
# Check that job got requeued self.server.log_match("Job;%s;Job requeued" % (jid), starttime=stime) @requirements(num_moms=3) def test_cgroup_msmom_nodes_only(self): """ Verify that exec_vnode values are trimmed when execjob_launch hook prunes job via release_nodes(), job is using only vnodes from mother superior host, tolerate_node_failures=job_start """ self.load_config(self.cfg7 % (self.mem, self.mem)) # disable queuejob hook hook_event = 'queuejob' hook_name = 'qjob' a = {'event': hook_event, 'enabled': 'false'} self.server.create_import_hook(hook_name, a, self.qjob_hook_body) # instantiate execjob_launch hook hook_event = 'execjob_launch' hook_name = 'launch' a = {'event': hook_event, 'enabled': 'true'} self.keep_select = '"ncpus=1:mem=100mb"' self.server.create_import_hook( hook_name, a, self.launch_hook_body % (self.keep_select)) # disable execjob_resize hook hook_event = 'execjob_resize' hook_name = 'resize' a = {'event': hook_event, 'enabled': 'false'} self.server.create_import_hook( hook_name, a, self.resize_hook_body % ('')) # Submit a job that requires two vnodes j = Job(TEST_USER) j.create_script(self.job_scr3) time.sleep(2) stime = int(time.time()) time.sleep(2) jid = self.server.submit(j) # Check the exec_vnode while in substate 41 self.server.expect(JOB, {ATTR_substate: '41'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode1 = job_stat[0]['exec_vnode'] self.logger.info("initial exec_vnode: %s" % execvnode1) initial_vnodes = execvnode1.split('+') # Check the exec_vnode after job is in substate 42 self.server.expect(JOB, {ATTR_substate: '42'}, id=jid) self.server.expect(JOB, 'exec_vnode', id=jid, op=SET) job_stat = self.server.status(JOB, id=jid) execvnode2 = job_stat[0]['exec_vnode'] self.logger.info("pruned exec_vnode: %s" % execvnode2) pruned_vnodes = execvnode2.split('+') # Check that the pruned exec_vnode has one less than initial value self.assertEqual(len(pruned_vnodes) + 1, 
len(initial_vnodes)) # Check that the exec_vnode got pruned self.moms_list[0].log_match("Job;%s;pruned from exec_vnode=%s" % ( jid, execvnode1), starttime=stime, n='ALL') self.moms_list[0].log_match("Job;%s;pruned to exec_vnode=%s" % ( jid, execvnode2), starttime=stime, n='ALL') # Find out the released vnode if initial_vnodes[0] == execvnode2: execvnodeB = initial_vnodes[1] else: execvnodeB = initial_vnodes[0] vnodeB = execvnodeB.split(':')[0].split('(')[1] self.logger.info("released vnode: %s" % vnodeB) # Submit job2 requesting the released vnode, job runs j2 = Job(TEST_USER, { ATTR_l + '.select': '1:ncpus=1:mem=100mb:vnode=%s' % vnodeB}) jid2 = self.server.submit(j2) self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2) @requirements(num_moms=3) def test_cgroups_abort(self): """ Verify that if one of the sister mom is down then cgroups hook will call the abort event which will cleanup the cgroups files on sister moms and primary mom """ self.logger.info("Stopping mom on host %s" % self.hosts_list[1]) self.moms_list[1].signal('-19') a = {'Resource_List.select': '1:ncpus=1:host=%s+1:ncpus=1:host=%s+1:ncpus=1:host=%s' % (self.hosts_list[0], self.hosts_list[1], self.hosts_list[2])} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R', 'substate': '41'} self.server.expect(JOB, a, jid) self.logger.info("Killing mom on host %s" % self.hosts_list[1]) time.sleep(2) now = int(time.time()) time.sleep(2) self.moms_list[1].signal('-9') self.server.expect(NODE, {'state': "down"}, id=self.hosts_list[1]) self.server.expect(JOB, {'job_state': 'Q'}, id=jid) # Verify that cgroups directories are cleaned on primary mom cpath = self.get_cgroup_job_dir('memory', jid, self.hosts_list[0]) self.assertFalse(self.is_dir(cpath, self.hosts_list[0])) # Verify that cgroups directories are cleaned by execjob_abort # hook on sister mom cpath = self.get_cgroup_job_dir('memory', jid, self.hosts_list[2]) self.assertFalse(self.is_dir(cpath, 
self.hosts_list[2])) self.moms_list[0].log_match("job_start_error", starttime=now, n='ALL') self.moms_list[0].log_match("Event type is execjob_abort", starttime=now, n='ALL') self.moms_list[0].log_match("Event type is execjob_epilogue", starttime=now, n='ALL') self.moms_list[0].log_match("Event type is execjob_end", starttime=now, n='ALL') self.moms_list[2].log_match("Event type is execjob_abort", starttime=now, n='ALL') self.moms_list[1].pi.restart() self.server.expect(JOB, {'job_state': 'R'}, id=jid) @timeout(1800) def test_big_cgroup_cpuset(self): """ With vnodes_per_numa and use_hyperthreads set to "true", test to verify that a job requesting at least 10 vnodes (i.e. 10 memory sockets) get a cgroup cpuset with the correct number of cpus and memory sockets. """ name = 'CGROUP_BIG' self.load_config(self.cfg9 % (self.mem, self.mem)) vnodes_count = 10 try: self.server.expect(VNODE, {'state=free': vnodes_count}, op=GE, count=True, interval=2) except Exception as exc: self.skipTest("Test require >= %d free vnodes" % (vnodes_count,)) rncpus = 'resources_available.ncpus' a = {rncpus: (GT, 0), 'state': 'free'} free_nodes = self.server.filter(VNODE, a, attrop=PTL_AND, idonly=False) vnodes = list(free_nodes.values())[0] self.assertGreaterEqual(len(vnodes), vnodes_count, 'Test does not have enough free vnodes') # find the minimum number of cpus found among the vnodes cpus_per_vnode = None for v in vnodes: v_rncpus = int(v[rncpus]) if not cpus_per_vnode: cpus_per_vnode = v_rncpus if v_rncpus < cpus_per_vnode: cpus_per_vnode = v_rncpus # Submit a job select_spec = "%d:ncpus=%d" % (vnodes_count, cpus_per_vnode) a = {'Resource_List.select': select_spec, ATTR_N: name + 'a'} j1 = Job(TEST_USER, attrs=a) j1.create_script(self.sleep600_job) jid1 = self.server.submit(j1) a = {'job_state': 'R'} # Make sure job is running self.server.expect(JOB, a, jid1) # cpuset path for job fn1 = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[0]) # Capture the output of cpuset_mem_script 
for job scr1 = self.du.run_cmd(cmd=[self.cpuset_mem_script % (fn1, None)], as_script=True, hosts=self.hosts_list[0]) tmp_out1 = scr1['out'] self.logger.info("test output for job1: %s" % (tmp_out1)) # Ensure the number of cpus assigned matches request cpuids = None for kv in tmp_out1: if 'CpuIDs=' in kv: cpuids = kv.split("=")[1] break cpus_assn = count_items(cpuids) cpus_req = vnodes_count * cpus_per_vnode self.logger.info("CpuIDs assn=%d req=%d" % (cpus_assn, cpus_req)) self.assertEqual(cpus_assn, cpus_req, 'CpuIDs assigned did not match requested') self.logger.info('CpuIDs check passed') # Ensure the number of sockets assigned matches request memsocket = None for kv in tmp_out1: if 'MemorySocket=' in kv: memsocket = kv.split("=")[1] break mem_assn = count_items(memsocket) self.logger.info("MemSocket assn=%d req=%d" % (mem_assn, vnodes_count)) self.assertEqual(mem_assn, vnodes_count, 'MemSocket assigned not match requested') self.logger.info('MemSocket check passed') @requirements(num_moms=2) def test_checkpoint_abort_preemption(self): """ Test to make sure that when scheduler preempts a multi-node job with checkpoint_abort, execjob_abort cgroups hook on secondary node gets called. The abort hook cleans up assigned cgroups, allowing the higher priority job to run on the same node. 
""" # create express queue a = {'queue_type': 'execution', 'started': 'True', 'enabled': 'True', 'Priority': 200} self.server.manager(MGR_CMD_CREATE, QUEUE, a, "express") # have scheduler preempt lower priority jobs using 'checkpoint' self.server.manager(MGR_CMD_SET, SCHED, {'preempt_order': 'C'}) # have moms do checkpoint_abort chk_script = """#!/bin/bash kill $1 exit 0 """ a = {'resources_available.ncpus': 1} for m in self.moms.values(): chk_file = m.add_checkpoint_abort_script(body=chk_script) # ensure resulting checkpoint file has correct permission self.du.chown(hostname=m.shortname, path=chk_file, uid=0, gid=0, sudo=True) self.server.manager(MGR_CMD_SET, NODE, a, id=m.shortname) # submit multi-node job a = {'Resource_List.select': '1:ncpus=1:host=%s+1:ncpus=1:host=%s' % ( self.hosts_list[0], self.hosts_list[1]), 'Resource_List.place': 'scatter:exclhost'} j1 = Job(TEST_USER, attrs=a) jid1 = self.server.submit(j1) # to work around a scheduling race, check for substate 42 # if you test for R then a slow job startup might update # resources_assigned late and make scheduler overcommit nodes # and run both jobs self.server.expect(JOB, {'substate': '42'}, id=jid1) # Submit an express queue job requesting needing also 2 nodes a[ATTR_q] = 'express' j2 = Job(TEST_USER, attrs=a) time.sleep(2) stime = int(time.time()) time.sleep(2) jid2 = self.server.submit(j2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid1) err_msg = "%s;.*Failed to assign resources.*" % (jid2,) for m in self.moms.values(): m.log_match(err_msg, max_attempts=3, interval=1, starttime=stime, regexp=True, existence=False, n='ALL') self.server.expect(JOB, {'job_state': 'R', 'substate': 42}, id=jid2) @requirements(num_moms=2) def test_checkpoint_restart(self): """ Test to make sure that when a preempted and checkpointed multi-node job restarts, execjob_begin cgroups hook gets called on both mother superior and sister moms. 
""" # create express queue a = {'queue_type': 'execution', 'started': 'True', 'enabled': 'True', 'Priority': 200} self.server.manager(MGR_CMD_CREATE, QUEUE, a, "express") # have scheduler preempt lower priority jobs using 'checkpoint' self.server.manager(MGR_CMD_SET, SCHED, {'preempt_order': 'C'}) # have moms do checkpoint_abort chk_script = """#!/bin/bash kill $1 exit 0 """ restart_script = """#!/bin/bash sleep 300 """ a = {'resources_available.ncpus': 1} for m in self.moms.values(): # add checkpoint script m.add_checkpoint_abort_script(body=chk_script) m.add_restart_script(body=restart_script, abort_time=300) self.server.manager(MGR_CMD_SET, NODE, a, id=m.shortname) # submit multi-node job a = {'Resource_List.select': '1:ncpus=1:host=%s+1:ncpus=1:host=%s' % ( self.hosts_list[0], self.hosts_list[1]), 'Resource_List.place': 'scatter:exclhost'} j1 = Job(TEST_USER, attrs=a) j1.set_sleep_time(300) jid1 = self.server.submit(j1) # to work around a scheduling race, check for substate 42 # if you test for R then a slow job startup might update # resources_assigned late and make scheduler overcommit nodes # and run both jobs self.server.expect(JOB, {'substate': '42'}, id=jid1) time.sleep(5) cpath = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[0]) self.assertTrue(self.is_dir(cpath, self.hosts_list[0])) cpath = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[1]) self.assertTrue(self.is_dir(cpath, self.hosts_list[1])) # Submit an express queue job requesting needing also 2 nodes a[ATTR_q] = 'express' j2 = Job(TEST_USER, attrs=a) j2.set_sleep_time(300) jid2 = self.server.submit(j2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid1) self.server.expect(JOB, {'substate': '42'}, id=jid2) time.sleep(5) cpath = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[0]) self.assertTrue(self.is_dir(cpath, self.hosts_list[0])) cpath = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[1]) self.assertTrue(self.is_dir(cpath, self.hosts_list[1])) # delete 
express queue job self.server.delete(jid2) # wait until the preempted job is sent to MoM again # the checkpointing script hangs, so it stays in substate 41 self.server.expect(JOB, {'job_state': 'R', 'substate': 41}, id=jid1) # we need to give the hooks some time here... time.sleep(10) # check the cpusets for the deleted preemptor are gone cpath = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[0]) self.assertFalse(self.is_dir(cpath, self.hosts_list[0])) cpath = self.get_cgroup_job_dir('cpuset', jid2, self.hosts_list[1]) self.assertFalse(self.is_dir(cpath, self.hosts_list[1])) # check the cpusets for the restarted formerly-preempted are there cpath = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[0]) self.assertTrue(self.is_dir(cpath, self.hosts_list[0])) cpath = self.get_cgroup_job_dir('cpuset', jid1, self.hosts_list[1]) self.assertTrue(self.is_dir(cpath, self.hosts_list[1])) def test_cpu_controller_enforce_default(self): """ Test an enabled cgroup 'cpu' controller with quotas enforced using default (non-specified) values of cfs_period_us, and cfs_quota_fudge_factor. """ root_quota_host1 = None try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If that link is missing and it's only # mounted under the cpu/cpuacct unified directory... 
if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/' 'cpu,cpuacct/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If still not found, try to see if it is in a unified cgroup mount # as in cgroup v2 if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass if root_quota_host1 is None: self.skipTest('cpu group controller test: ' 'could not determine root cfs_quota_us') elif root_quota_host1 != -1: self.skipTest('cpu group controller test: ' 'root cfs_quota_us is not unlimited, cannot test ' 'cgroup hook CPU quotas in this environment') name = 'CGROUP1' self.load_config(self.cfg10 % (self.mem, self.mem)) default_cfs_period_us = 100000 default_cfs_quota_fudge_factor = 1.03 # Restart mom for changes made by cgroups hook to take effect self.mom.restart() self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0], interval=1) result = self.server.status(NODE, 'resources_available.ncpus', id=self.nodes_list[0]) orig_ncpus = int(result[0]['resources_available.ncpus']) self.assertGreater(orig_ncpus, 0) self.logger.info('Original value of ncpus: %d' % orig_ncpus) if orig_ncpus >= 2: ncpus_req = 2 else: ncpus_req = 1 a = {'Resource_List.select': "ncpus=%d" % ncpus_req, ATTR_N: name, ATTR_k: 'oe'} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) self.server.status(JOB, [ATTR_o, 'exec_host'], jid) fna = self.get_cgroup_job_dir('cpu', jid, self.hosts_list[0]) self.assertFalse(fna is None, 'No job directory for cpu subsystem') cpu_scr = self.du.run_cmd(cmd=[self.cpu_controller_script % fna], as_script=True, hosts=self.hosts_list[0]) cpu_scr_out = cpu_scr['out'] 
self.logger.info('cpu_scr_out:\n%s' % cpu_scr_out) shares_match = (ncpus_req * 1000) self.assertTrue("cpu_shares=%d" % shares_match in cpu_scr_out) self.logger.info("cpu_shares check passed (match %d)" % shares_match) self.assertTrue("cpu_cfs_period_us=%d" % (default_cfs_period_us) in cpu_scr_out) self.logger.info("cpu_cfs_period_us check passed (match %d)" % (default_cfs_period_us)) cfs_quota_us_match = default_cfs_period_us * \ ncpus_req * default_cfs_quota_fudge_factor self.assertTrue("cpu_cfs_quota_us=%d" % (cfs_quota_us_match) in cpu_scr_out) self.logger.info("cpu_cfs_quota_us check passed (match %d)" % (cfs_quota_us_match)) def test_cpu_controller_enforce(self): """ Test an enabled cgroup 'cpu' controller with quotas enforced, using specific values to: cfs_period_us cfs_quota_fudge_factor in config file 'cfg11'. """ root_quota_host1 = None try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If that link is missing and it's only # mounted under the cpu/cpuacct unified directory... 
if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/' 'cpu,cpuacct/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If still not found, try to see if it is in a unified cgroup mount # as in cgroup v2 if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass if root_quota_host1 is None: self.skipTest('cpu group controller test: ' 'could not determine root cfs_quota_us') elif root_quota_host1 != -1: self.skipTest('cpu group controller test: ' 'root cfs_quota_us is not unlimited, cannot test ' 'cgroup hook CPU quotas in this environment') name = 'CGROUP1' cfs_period_us = 200000 cfs_quota_fudge_factor = 1.05 self.load_config(self.cfg11 % (self.mem, self.mem, cfs_period_us, cfs_quota_fudge_factor)) self.server.expect(NODE, {'state': 'free'}, id=self.nodes_list[0], interval=1) result = self.server.status(NODE, 'resources_available.ncpus', id=self.nodes_list[0]) orig_ncpus = int(result[0]['resources_available.ncpus']) self.assertGreater(orig_ncpus, 0) self.logger.info('Original value of ncpus: %d' % orig_ncpus) if orig_ncpus >= 2: ncpus_req = 2 else: ncpus_req = 1 a = {'Resource_List.select': "ncpus=%d" % ncpus_req, ATTR_N: name, ATTR_k: 'oe'} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) self.server.status(JOB, [ATTR_o, 'exec_host'], jid) fna = self.get_cgroup_job_dir('cpu', jid, self.hosts_list[0]) self.assertFalse(fna is None, 'No job directory for cpu subsystem') cpu_scr = self.du.run_cmd(cmd=[self.cpu_controller_script % fna], as_script=True, hosts=self.hosts_list[0]) cpu_scr_out = cpu_scr['out'] self.logger.info('cpu_scr_out:\n%s' % cpu_scr_out) shares_match = (ncpus_req * 
1000) self.assertTrue("cpu_shares=%d" % shares_match in cpu_scr_out) self.logger.info("cpu_shares check passed (match %d)" % shares_match) self.assertTrue("cpu_cfs_period_us=%d" % (cfs_period_us) in cpu_scr_out) self.logger.info( "cpu_cfs_period_us check passed (match %d)" % (cfs_period_us)) cfs_quota_us_match = cfs_period_us * ncpus_req * cfs_quota_fudge_factor self.assertTrue("cpu_cfs_quota_us=%d" % (cfs_quota_us_match) in cpu_scr_out) self.logger.info("cpu_cfs_quota_us check passed (match %d)" % (cfs_quota_us_match)) def test_cpu_controller_enforce_default_zero_job(self): """ Test an enabled cgroup 'cpu' controller with quotas enforced on zero-cpu job, using default (non-specified) values of: cfs_period_us cfs_quota_fudge_factor zero_cpus_shares_fraction zero_cpus_quota_fraction """ root_quota_host1 = None try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If that link is missing and it's only # mounted under the cpu/cpuacct unified directory... 
if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/' 'cpu,cpuacct/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass # If still not found, try to see if it is in a unified cgroup mount # as in cgroup v2 if root_quota_host1 is None: try: root_quota_host1_str = \ self.du.run_cmd(hosts=self.hosts_list[0], cmd=['cat', '/sys/fs/cgroup/cpu.cfs_quota_us']) root_quota_host1 = int(root_quota_host1_str['out'][0]) except Exception: pass if root_quota_host1 is None: self.skipTest('cpu group controller test: ' 'could not determine root cfs_quota_us') elif root_quota_host1 != -1: self.skipTest('cpu group controller test: ' 'root cfs_quota_us is not unlimited, cannot test ' 'cgroup hook CPU quotas in this environment') name = 'CGROUP1' # config file 'cfg12' has 'allow_zero_cpus=true' under cpuset, to allow # zero-cpu jobs. self.load_config(self.cfg12 % (self.mem, self.mem)) default_cfs_period_us = 100000 default_cfs_quota_fudge_factor = 1.03 default_zero_shares_fraction = 0.002 default_zero_quota_fraction = 0.2 # Restart mom for changes made by cgroups hook to take effect self.mom.restart() a = {'Resource_List.select': 'ncpus=0', ATTR_N: name, ATTR_k: 'oe'} j = Job(TEST_USER, attrs=a) j.create_script(self.sleep600_job) jid = self.server.submit(j) a = {'job_state': 'R'} self.server.expect(JOB, a, jid) self.server.status(JOB, [ATTR_o, 'exec_host'], jid) fna = self.get_cgroup_job_dir('cpu', jid, self.hosts_list[0]) self.assertFalse(fna is None, 'No job directory for cpu subsystem') cpu_scr = self.du.run_cmd(cmd=[self.cpu_controller_script % fna], as_script=True, hosts=self.hosts_list[0]) cpu_scr_out = cpu_scr['out'] self.logger.info('cpu_scr_out:\n%s' % cpu_scr_out) shares_match = (default_zero_shares_fraction * 1000) self.assertTrue("cpu_shares=%d" % shares_match in cpu_scr_out) self.logger.info("cpu_shares check passed (match %d)" % shares_match) 
    def test_cpu_controller_enforce_zero_job(self):
        """
        Test an enabled cgroup 'cpu' controller with quotas enforced on a
        zero-cpu job. Quotas are enforced using specific values to:
        cfs_period_us
        cfs_quota_fudge_factor
        zero_cpus_shares_fraction
        zero_cpus_quota_fraction
        in config file 'cfg13'.
        """
        # Probe the root cgroup's cfs_quota_us; the file may live in one
        # of three places depending on how cgroups are mounted on the host.
        root_quota_host1 = None
        try:
            root_quota_host1_str = \
                self.du.run_cmd(hosts=self.hosts_list[0],
                                cmd=['cat',
                                     '/sys/fs/cgroup/cpu/cpu.cfs_quota_us'])
            root_quota_host1 = int(root_quota_host1_str['out'][0])
        except Exception:
            pass
        # If that link is missing and it's only
        # mounted under the cpu/cpuacct unified directory...
        if root_quota_host1 is None:
            try:
                root_quota_host1_str = \
                    self.du.run_cmd(hosts=self.hosts_list[0],
                                    cmd=['cat', '/sys/fs/cgroup/'
                                         'cpu,cpuacct/cpu.cfs_quota_us'])
                root_quota_host1 = int(root_quota_host1_str['out'][0])
            except Exception:
                pass
        # If still not found, try to see if it is in a unified cgroup mount
        # as in cgroup v2
        if root_quota_host1 is None:
            try:
                root_quota_host1_str = \
                    self.du.run_cmd(hosts=self.hosts_list[0],
                                    cmd=['cat',
                                         '/sys/fs/cgroup/cpu.cfs_quota_us'])
                root_quota_host1 = int(root_quota_host1_str['out'][0])
            except Exception:
                pass
        # -1 means "unlimited"; anything else means the environment already
        # caps the root cgroup and the hook's quotas cannot be verified.
        if root_quota_host1 is None:
            self.skipTest('cpu group controller test: '
                          'could not determine root cfs_quota_us')
        elif root_quota_host1 != -1:
            self.skipTest('cpu group controller test: '
                          'root cfs_quota_us is not unlimited, cannot test '
                          'cgroup hook CPU quotas in this environment')
        name = 'CGROUP1'
        # Non-default quota knobs pushed into the hook via cfg13.
        cfs_period_us = 200000
        cfs_quota_fudge_factor = 1.05
        zero_cpus_shares_fraction = 0.3
        zero_cpus_quota_fraction = 0.5
        # config file 'cfg13' has 'allow_zero_cpus=true' under cpuset, to allow
        # zero-cpu jobs.
        self.load_config(self.cfg13 % (self.mem, self.mem, cfs_period_us,
                                       cfs_quota_fudge_factor,
                                       zero_cpus_shares_fraction,
                                       zero_cpus_quota_fraction))
        a = {'Resource_List.select': 'ncpus=0', ATTR_N: name, ATTR_k: 'oe'}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        self.server.status(JOB, [ATTR_o, 'exec_host'], jid)
        fna = self.get_cgroup_job_dir('cpu', jid, self.hosts_list[0])
        self.assertFalse(fna is None, 'No job directory for cpu subsystem')
        # Run the helper script that dumps the job's cpu cgroup settings.
        cpu_scr = self.du.run_cmd(cmd=[self.cpu_controller_script % fna],
                                  as_script=True, hosts=self.hosts_list[0])
        cpu_scr_out = cpu_scr['out']
        self.logger.info('cpu_scr_out:\n%s' % cpu_scr_out)
        # Zero-cpu jobs get the configured shares fraction of the
        # per-cpu 1000.
        shares_match = (zero_cpus_shares_fraction * 1000)
        self.assertTrue("cpu_shares=%d" % shares_match in cpu_scr_out)
        self.logger.info("cpu_shares check passed (match %d)" % shares_match)
        self.assertTrue("cpu_cfs_period_us=%d" % (cfs_period_us)
                        in cpu_scr_out)
        self.logger.info(
            "cpu_cfs_period_us check passed (match %d)" % (cfs_period_us))
        # Quota = period * zero-cpu fraction * fudge factor.
        cfs_quota_us_match = cfs_period_us * \
            zero_cpus_quota_fraction * cfs_quota_fudge_factor
        self.assertTrue("cpu_cfs_quota_us=%d" % (cfs_quota_us_match)
                        in cpu_scr_out)
        self.logger.info("cpu_cfs_quota_us check passed (match %d)"
                         % (cfs_quota_us_match))
    def test_vnodepernuma_use_hyperthreads(self):
        """
        Test to verify that correct number of jobs run with
        vnodes_per_numa=true and use_hyperthreads=true
        """
        # Parse /proc/cpuinfo to learn the host topology:
        # pcpus = logical processors, sibs = siblings per package,
        # cores = cores per package, phys = set of physical package ids.
        pcpus = 0
        sibs = 0
        cores = 0
        pval = 0
        phys = {}
        with open('/proc/cpuinfo', 'r') as desc:
            for line in desc:
                if re.match('^processor', line):
                    pcpus += 1
                sibs_match = re.search(r'siblings : ([0-9]+)', line)
                cores_match = re.search(r'cpu cores : ([0-9]+)', line)
                phys_match = re.search(r'physical id : ([0-9]+)', line)
                if sibs_match:
                    sibs = int(sibs_match.groups()[0])
                if cores_match:
                    cores = int(cores_match.groups()[0])
                if phys_match:
                    pval = int(phys_match.groups()[0])
                    # dict used as a set of distinct physical packages
                    phys[pval] = 1
        if (sibs == 0 or cores == 0):
            self.skipTest('Insufficient information about the processors.')
        if pcpus < 2:
            self.skipTest('This test requires at least two processors.')
        # siblings / cores gives hyperthreads per core (1 if HT is off)
        hyperthreads_per_core = int(sibs / cores)
        name = 'CGROUP20'
        # set vnode_per_numa=true with use_hyperthreads=true
        self.load_config(self.cfg3 % ('', 'true', '', self.mem, '',
                                      self.swapctl, ''))
        # Submit M*N*P jobs, where M is the number of physical processors,
        # N is the number of 'cpu cores' per M. and P being the
        # number of hyperthreads per core.
        njobs = len(phys) * cores * hyperthreads_per_core
        if njobs > 100:
            self.skipTest("too many jobs (%d) to submit" % njobs)
        a = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name + 'a'}
        # Every job up to the hyperthread count should run.
        for _ in range(njobs):
            j = Job(TEST_USER, attrs=a)
            # make sure this stays around for an hour
            # (or until deleted in teardown)
            j.set_sleep_time(3600)
            jid = self.server.submit(j)
            a1 = {'job_state': 'R'}
            self.server.expect(JOB, a1, jid)
        # Submit another job, expect in Q state
        b = {'Resource_List.select': '1:ncpus=1:mem=300mb:host=%s' %
             self.hosts_list[0], ATTR_N: name + 'b'}
        j2 = Job(TEST_USER, attrs=b)
        jid2 = self.server.submit(j2)
        b1 = {'job_state': 'Q'}
        self.server.expect(JOB, b1, jid2)
    def test_cgroup_default_config(self):
        """
        Test to make sure using the default hook config file still run
        a basic job, and cleans up cpuset upon qdel.
        """
        # The default hook config has 'memory' subsystem enabled
        if not self.paths[self.hosts_list[0]]['memory']:
            self.skipTest('Test requires memory subystem mounted')
        self.load_default_config()
        # Reduce the noise in mom_logs for existence=False matching
        c = {'$logevent': '511'}
        self.mom.add_config(c)
        a = {'Resource_List.select': 'ncpus=1:mem=100mb'}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        # sleep around the timestamp so clock skew/rounding cannot make
        # pre-existing log lines match starttime=stime below
        time.sleep(2)
        stime = int(time.time())
        time.sleep(2)
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R'}, jid)
        # The hook must not have tripped over memsw files on this job.
        err_msg = "write_value: Permission denied.*%s.*memsw" % (jid)
        self.mom.log_match(err_msg, max_attempts=3, interval=1, n='ALL',
                           starttime=stime, regexp=True, existence=False)
        self.server.status(JOB, ['exec_host'], jid)
        ehost = j.attributes['exec_host']
        # exec_host looks like "host/idx..."; keep only the hostname
        ehost1 = ehost.split('/')[0]
        ehjd1 = self.get_cgroup_job_dir('cpuset', jid, ehost1)
        self.assertTrue(self.is_dir(ehjd1, ehost1),
                        "job cpuset dir not found")
        # Deleting the job must remove its cpuset directory.
        self.server.delete(id=jid, wait=True)
        self.assertFalse(self.is_dir(ehjd1, ehost1), "job cpuset dir found")
    def test_cgroup_cgswap(self, vnode_per_numa_node=False):
        """
        Test to verify (with vnode_per_numa_node disabled by default):
        - whether queuejob/modifyjob set cgswap to vmem-mem in jobs
        - whether nodes get resources_available.cgswap filled in
        - whether a collection of jobs submitted that do not exceed
          available vmem but would deplete cgswap are indeed not all
          run simultaneously
        """
        if not self.mem:
            self.skipTest('Test requires memory subystem mounted')
        if self.swapctl != 'true':
            self.skipTest('Test requires memsw accounting enabled')
        # (Re)create the cgswap custom resource and let the scheduler
        # consider it.
        self.server.remove_resource('cgswap')
        self.server.add_resource('cgswap', 'size', 'nh')
        self.scheduler.add_resource('cgswap')
        events = ['execjob_begin', 'execjob_launch', 'execjob_attach',
                  'execjob_epilogue', 'execjob_end', 'exechost_startup',
                  'exechost_periodic', 'execjob_resize', 'execjob_abort',
                  'queuejob', 'modifyjob']
        # Enable the cgroups hook new events
        conf = {'enabled': 'True', 'freq': 10, 'event': events}
        self.server.manager(MGR_CMD_SET, HOOK, conf, self.hook_name)
        self.load_config(self.cfg15
                         % ('true' if vnode_per_numa_node else 'false'))
        vnode_name = self.mom.shortname
        if vnode_per_numa_node:
            # first NUMA vnode of the natural host
            vnode_name += "[0]"
        # The hook's exechost_startup event should have published cgswap.
        cgswapstat = self.server.status(NODE, 'resources_available.cgswap',
                                        id=vnode_name)
        self.assertTrue(cgswapstat
                        and 'resources_available.cgswap' in cgswapstat[0],
                        'cgswap resource not found on node')
        cgswap = PbsTypeSize(cgswapstat[0]['resources_available.cgswap'])
        self.logger.info('Test node appears to have %s cgswap'
                         % cgswap.encode())
        if cgswap == PbsTypeSize("0kb"):
            # No swap on the node: only verify that queuejob adds
            # cgswap = vmem - mem and that the job then cannot run.
            self.logger.info('First Mom has no swap, test will just '
                             'check if job cgswap is added')
            a = {'Resource_List.select':
                 '1:ncpus=0:mem=100mb:vmem=1100mb:vnode=%s' % vnode_name}
            j = Job(TEST_USER, attrs=a)
            j.create_script(self.sleep30_job)
            jid = self.server.submit(j)
            # scheduler sets comment when the job cannot run,
            # server sets comment when the job runs
            # in both cases the comment gets set
            self.server.expect(JOB, 'comment', op=SET)
            job_status = self.server.status(JOB, id=jid)
            # Dig the cgswap chunk value out of the translated select spec.
            cgswap = None
            select_resource = job_status[0]['Resource_List.select']
            chunkspecs = select_resource.split(':')
            for c in chunkspecs:
                if '=' in c:
                    name, value = c.split('=')
                    if name == 'cgswap':
                        cgswap = PbsTypeSize(value)
            self.assertTrue(cgswap is not None, 'job cgswap was not added')
            # vmem(1100mb) - mem(100mb) = 1000mb
            self.assertTrue(cgswap == PbsTypeSize('1000mb'),
                            'job cgswap is %s instead of expected 1000mb'
                            % str(cgswap))
            self.logger.info('job cgswap detected to be correct, roughly %s'
                             % str(cgswap))
            # check that indeed you cannot run the job since it requests
            # swap usage and there is none
            job_comment = job_status[0]['comment']
            self.assertTrue('Insufficient amount of resource: cgswap'
                            in job_comment,
                            'Job comment should indicate insufficient cgswap '
                            'but is: %s' % job_comment)
            self.logger.info('job comment as expected: %s' % job_comment)
        else:
            self.logger.info('First MoM has swap, confirming cgswap '
                             'correctly throttles jobs accepted')
            # Request 2/3 of the node's swap per job so that one job fits
            # but two do not.
            # PbsTypeSize value is stored in kb units
            cgreqval = int(float(cgswap.value) / 1024.0 / 3.0 * 2.0)
            cgreqsuffix = 'mb'
            cgreq = PbsTypeSize(str(cgreqval) + cgreqsuffix)
            vmemreqsize = PbsTypeSize("100mb") + cgreq
            vmemreq = str(int(vmemreqsize.value / 1024))+'mb'
            self.logger.info('will submit jobs with 100mb mem and %s vmem'
                             % vmemreq)
            a = {'Resource_List.select':
                 '1:ncpus=0:mem=100mb:vmem=%s:vnode=%s'
                 % (vmemreq, vnode_name)}
            j = Job(TEST_USER, attrs=a)
            j.create_script(self.sleep600_job)
            jid = self.server.submit(j)
            bs = {'job_state': 'R'}
            self.server.expect(JOB, bs, jid, offset=1)
            # Dig the cgswap chunk value out of the translated select spec.
            cgswap = None
            job_status = self.server.status(JOB, id=jid)
            select_resource = job_status[0]['Resource_List.select']
            chunkspecs = select_resource.split(':')
            for c in chunkspecs:
                if '=' in c:
                    name, value = c.split('=')
                    if name == 'cgswap':
                        cgswap = PbsTypeSize(value)
            self.assertTrue(cgswap is not None, 'job cgswap was not added')
            self.assertTrue(cgswap == cgreq,
                            'job cgswap is %s instead of expected %s'
                            % (str(cgswap), str(cgreq)))
            self.logger.info('job cgswap detected to be correct, roughly %s'
                             % str(cgswap))
            j = Job(TEST_USER, attrs=a)
            j.create_script(self.sleep600_job)
            jid = self.server.submit(j)
            # Second job should not run - not enough cgswap
            # scheduler sets comment when the job cannot run,
            # server sets comment when the job runs
            # in both cases the comment gets set
            self.server.expect(JOB, 'comment', op=SET)
            job_status = self.server.status(JOB, id=jid)
            # check that indeed you cannot run the job since it requests
            # too much swap usage while the first job runs
            job_comment = job_status[0]['comment']
            self.assertTrue('Insufficient amount of resource: cgswap'
                            in job_comment,
                            'Job comment should indicate insufficient cgswap '
                            'but is: %s' % job_comment)
            self.logger.info('job comment as expected: %s' % job_comment)
    def test_cgroup_cgswap_numa(self):
        """
        Test to verify (with vnode_per_numa_node enabled):
        - whether queuejob/modifyjob set cgswap to vmem-mem in jobs
        - whether nodes get resources_available.cgswap filled in
        - whether a collection of jobs submitted that do not exceed
          available vmem but would deplete cgswap are indeed not all
          run simultaneously
        """
        # Same scenario as test_cgroup_cgswap, but against the first
        # per-NUMA vnode instead of the natural host vnode.
        self.test_cgroup_cgswap(vnode_per_numa_node=True)
None, "Unable to read total memsw available") self.logger.info("total available memsw: %d" % vmem_avail_in_bytes) # Get job physical mem limit mem_limit = os.path.join(mem_base, str(jid), 'memory.limit_in_bytes') result = self.du.cat(hostname=self.mom.hostname, filename=mem_limit, sudo=True) mem_limit_in_bytes = None try: mem_limit_in_bytes = int(result['out'][0]) except Exception: # None will be seen as a failure, nothing to do pass self.assertTrue(mem_limit_in_bytes is not None, "Unable to read job mem limit") self.logger.info("job mem limit: %d" % mem_limit_in_bytes) # Get job phys+swap mem limit vmem_limit = os.path.join(mem_base, str(jid), 'memory.memsw.limit_in_bytes') result = self.du.cat(hostname=self.mom.hostname, filename=vmem_limit, sudo=True) vmem_limit_in_bytes = None try: vmem_limit_in_bytes = int(result['out'][0]) except Exception: # None will be seen as a failure, nothing to do pass self.assertTrue(vmem_limit_in_bytes is not None, "Unable to read job memsw limit") self.logger.info("job memsw limit: %d" % vmem_limit_in_bytes) # Check results correspond to enforcement flags and job placement swap_avail = vmem_avail_in_bytes - mem_avail_in_bytes if enforce_flags[0] == 'true' and not exclhost: self.assertTrue(mem_limit_in_bytes == 100 * 1024 * 1024, "Job mem limit is %d expected %d" % (mem_limit_in_bytes, 100 * 1024 * 1024)) else: self.assertTrue(mem_avail_in_bytes == mem_limit_in_bytes, "job mem limit (%d) should be identical to " "total mem available (%d)" % (mem_limit_in_bytes, mem_avail_in_bytes)) self.logger.info("job mem limit is total mem available (%d)" % mem_avail_in_bytes) if enforce_flags[1] == 'true' and not exclhost: expected_vmem = (mem_limit_in_bytes + min(100 * 1024 * 1024, swap_avail)) self.assertTrue(vmem_limit_in_bytes == expected_vmem, "memsw limit: expected %d, got %d" % (expected_vmem, vmem_limit_in_bytes)) self.logger.info("job memsw limit is expected %d" % vmem_limit_in_bytes) else: if swap_avail: 
    def test_cgroup_enforce_default_tf(self):
        """
        Test to verify if the flags to enforce default mem are working
        and to ensure mem and memsw limits are set as expected;
        enforce mem but not memsw: job should get small mem limit
        memsw should be unlimited (i.e. able to consume memsw set
        as limit for all jobs)
        """
        self.test_cgroup_enforce_default(enforce_flags=('true', 'false'))

    def test_cgroup_enforce_default_ft(self):
        """
        Test to verify if the flags to enforce default mem are working
        and to ensure mem and memsw limits are set as expected;
        enforce memsw but not mem: job should be able to consume all
        physical memory set as limit for all jobs but only a small
        amount of additional swap
        """
        self.test_cgroup_enforce_default(enforce_flags=('false', 'true'))

    def test_cgroup_enforce_default_exclhost(self):
        """
        Test to verify if the flags to enforce default mem are working
        and to ensure mem and memsw limits are set as expected;
        enforce neither mem nor memsw by enabling flags to ignore
        enforcement for exclhost jobs and submitting an exclhost job:
        job should be able to consume all physical memory and memsw
        set as limit for all jobs
        """
        # enforce flags should both be overrided by exclhost
        self.test_cgroup_enforce_default(enforce_flags=('true', 'true'),
                                         exclhost=True)

    def test_manage_rlimit_as(self):
        """
        Test that the hook manages RLIMIT_AS correctly: a job that
        requests vmem but no pvmem gets an unlimited address-space
        limit, while a job that also requests pvmem gets RLIMIT_AS
        set to the pvmem value (checked via 'ulimit -v' job output).
        """
        if not self.mem:
            self.skipTest('Test requires memory subystem mounted')
        if self.swapctl != 'true':
            self.skipTest('Test requires memsw accounting enabled')
        # Make sure job history is enabled to see when job has ended
        a = {'job_history_enable': 'True'}
        rc = self.server.manager(MGR_CMD_SET, SERVER, a)
        self.assertEqual(rc, 0)
        self.server.expect(SERVER, {'job_history_enable': 'True'})
        self.load_config(self.cfg16 % ('true', 'true'))
        # First job -- request vmem and no pvmem,
        # RLIMIT_AS should be unlimited
        a = {'Resource_List.select':
             '1:ncpus=0:mem=400mb:vmem=400mb:vnode=%s' % self.mom.shortname}
        j = Job(TEST_USER, attrs=a)
        j.create_script("#!/bin/bash\nulimit -v")
        jid = self.server.submit(j)
        bs = {'job_state': 'F'}
        self.server.expect(JOB, bs, jid, extend='x', offset=1)
        thisjob = self.server.status(JOB, id=jid, extend='x')
        try:
            # Output_Path is "host:path"; keep only the path part
            job_output_file = thisjob[0]['Output_Path'].split(':')[1]
        except Exception:
            self.assertTrue(False, "Could not determine job output path")
        result = self.du.cat(hostname=self.server.hostname,
                             filename=job_output_file, sudo=True)
        self.assertTrue('out' in result, "Nothing in job output file?")
        job_out = '\n'.join(result['out'])
        self.logger.info("job_out=%s" % job_out)
        self.assertTrue('unlimited' in job_out)
        self.logger.info("Job that requests vmem "
                         "but no pvmem correctly has unlimited RLIMIT_AS")
        # Second job -- see if pvmem still works
        # RLIMIT_AS should correspond to pvmem
        a['Resource_List.pvmem'] = '400mb'
        j = Job(TEST_USER, attrs=a)
        j.create_script("#!/bin/bash\nulimit -v")
        jid = self.server.submit(j)
        bs = {'job_state': 'F'}
        self.server.expect(JOB, bs, jid, extend='x', offset=1)
        thisjob = self.server.status(JOB, id=jid, extend='x')
        try:
            # Output_Path is "host:path"; keep only the path part
            job_output_file = thisjob[0]['Output_Path'].split(':')[1]
        except Exception:
            self.assertTrue(False, "Could not determine job output path")
        result = self.du.cat(hostname=self.server.hostname,
                             filename=job_output_file, sudo=True)
        self.assertTrue('out' in result, "Nothing in job output file?")
        job_out = '\n'.join(result['out'])
        self.logger.info("job_out=%s" % job_out)
        # ulimit reports kb, not bytes
        self.assertTrue(str(400 * 1024) in job_out)
        self.logger.info("Job that requests 400mb pvmem "
                         "correctly has 400mb RLIMIT_AS")
    def test_cgroup_mount_paths(self):
        """
        Test to see if the cgroup hook picks the shortest path, but
        also if it can be overrided in the config file
        """
        # The test creates its own extra cgroup mounts; require that the
        # mount points do not already exist.
        if self.du.isdir(self.hosts_list[0], '/dev/tstc'):
            self.skipTest('Test requires /dev/tstc not to exist')
        if self.du.isdir(self.hosts_list[0], '/dev/tstm'):
            self.skipTest('Test requires /dev/tstm not to exist')
        self.load_config(self.cfg17)
        # Mount a second 'memory' cgroup hierarchy at the shorter path
        # /dev/tstm...
        dir_created = self.du.mkdir(hostname=self.hosts_list[0],
                                    path='/dev/tstm', mode=0o0755,
                                    sudo=True)
        if not dir_created:
            self.skipTest('not able to create /dev/tstm')
        result = self.du.run_cmd(self.hosts_list[0],
                                 ['mount', '-t', 'cgroup', '-o',
                                  'rw,nosuid,nodev,noexec,relatime,seclabel,'
                                  'memory', 'cgroup', '/dev/tstm'],
                                 sudo=True)
        if result['rc'] != 0:
            self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstm'],
                            sudo=True)
            self.skipTest('not able to mount /dev/tstm')
        # ...and a second 'cpuset' hierarchy at /dev/tstc; undo earlier
        # mounts on each skip path.
        dir_created = self.du.mkdir(hostname=self.hosts_list[0],
                                    path='/dev/tstc', mode=0o0755,
                                    sudo=True)
        if not dir_created:
            self.du.run_cmd(self.hosts_list[0], ['umount', '/dev/tstm'],
                            sudo=True)
            self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstm'],
                            sudo=True)
            self.skipTest('not able to create /dev/tstc')
        result = self.du.run_cmd(self.hosts_list[0],
                                 ['mount', '-t', 'cgroup', '-o',
                                  'rw,nosuid,nodev,noexec,relatime,seclabel,'
                                  'cpuset', 'cgroup', '/dev/tstc'],
                                 sudo=True)
        if result['rc'] != 0:
            self.du.run_cmd(self.hosts_list[0], ['umount', '/dev/tstm'],
                            sudo=True)
            self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstm'],
                            sudo=True)
            self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstc'],
                            sudo=True)
            self.skipTest('not able to mount /dev/tstc')
        # sleep 2s: make sure no old log lines will match 'begin' time
        time.sleep(2)
        begin = int(time.time())
        # sleep 2s to allow for small time differences and rounding errors
        time.sleep(2)
        a = {'Resource_List.select': "1:ncpus=1:host=%s"
             % self.hosts_list[0]}
        j = Job(TEST_USER, attrs=a)
        j.create_script(self.sleep600_job)
        jid = self.server.submit(j)
        a = {'job_state': 'R'}
        self.server.expect(JOB, a, jid)
        # Record failures but keep going, so the extra mounts are always
        # cleaned up before the final assertion.
        failure = False
        try:
            self.moms_list[0].log_match(msg='create_job: Creating directory '
                                            '/sys/fs/cgroup/cpuset/'
                                            'pbs_jobs.service/jobid/%s' % jid,
                                        n='ALL', starttime=begin,
                                        max_attempts=1)
        except Exception:
            failure = True
        try:
            self.moms_list[0].log_match(msg='create_job: Creating directory '
                                            '/dev/tstm/'
                                            'pbs_jobs.service/jobid/%s' % jid,
                                        n='ALL', starttime=begin,
                                        max_attempts=1)
        except Exception:
            failure = True
        self.du.run_cmd(self.hosts_list[0], ['umount', '/dev/tstm'],
                        sudo=True)
        self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstm'],
                        sudo=True)
        self.du.run_cmd(self.hosts_list[0], ['umount', '/dev/tstc'],
                        sudo=True)
        self.du.run_cmd(self.hosts_list[0], ['rmdir', '/dev/tstc'],
                        sudo=True)
        self.assertFalse(failure,
                         'Did not find correct paths for created cgroup dirs')
    def cleanup_frozen_jobs(self, host):
        # Cleanup frozen jobs
        # Thaw ALL freezers found
        # If directory starts with a number (i.e. a job)
        # kill processes in the freezers and remove them
        if 'freezer' in self.paths[host]:
            # Find freezers to thaw
            self.logger.info('Cleaning up frozen jobs ****')
            fdir = self.paths[host]['freezer']
            # freezer.state files may sit 1, 2 or 3 levels below the mount
            freezer_states = \
                glob.glob(os.path.join(fdir, '*', '*', '*', 'freezer.state'))
            freezer_states += \
                glob.glob(os.path.join(fdir, '*', '*', 'freezer.state'))
            freezer_states += \
                glob.glob(os.path.join(fdir, '*', 'freezer.state'))
            self.logger.info('*** found freezer states %s'
                             % str(freezer_states))
            for freezer_state in freezer_states:
                # thaw the freezer
                self.logger.info('Thawing ' + freezer_state)
                state = 'THAWED'
                fn = self.du.create_temp_file(body=state)
                self.du.run_copy(hosts=host, src=fn, dest=freezer_state,
                                 sudo=True, uid='root', gid='root',
                                 mode=0o644)
                # Confirm it's thawed
                for count in range(30):
                    ret = self.du.cat(hostname=host, filename=freezer_state,
                                      sudo=True)
                    if ret['rc'] != 0:
                        self.logger.info("Cannot confirm freezer state"
                                         "sleeping 30 seconds instead")
                        time.sleep(30)
                        break
                    if ret['out'][0] == 'THAWED':
                        self.logger.info("freezer processes reported as"
                                         " THAWED")
                        break
                    else:
                        self.logger.info("freezer state reported as "
                                         + ret['out'][0])
                        time.sleep(1)
                # Job freezers are named after the job id (leading number)
                freezer_basename = os.path.basename(
                    os.path.dirname(freezer_state))
                jobid = None
                try:
                    jobid = int(freezer_basename.split('.')[0])
                except Exception:
                    # not a job directory
                    pass
                if jobid is not None:
                    self.logger.info(
                        "Apparently found job freezer for job %s"
                        % freezer_basename)
                    freezer_tasks = os.path.join(
                        os.path.dirname(freezer_state), "tasks")
                    # Kill tasks before trying to rmdir freezer
                    ret = self.du.cat(hostname=host, filename=freezer_tasks,
                                      sudo=True)
                    if ret['rc'] == 0:
                        for taskstr in ret['out']:
                            self.logger.info("trying to kill %s on %s"
                                             % (taskstr,
                                                self.hosts_list[0]))
                            self.du.run_cmd(host,
                                            ['kill', '-9'] + [taskstr],
                                            sudo=True)
                    # Poll until the tasks file is empty (rmdir fails on a
                    # non-empty cgroup)
                    for count in range(30):
                        ret = self.du.cat(hostname=host,
                                          filename=freezer_tasks,
                                          sudo=True)
                        if ret['rc'] != 0:
                            self.logger.info("Cannot confirm freezer tasks; "
                                             "sleeping 30 seconds instead")
                            time.sleep(30)
                            break
                        if ret['out'] == [] or ret['out'][0] == '':
                            self.logger.info("Processes in thawed freezer"
                                             " are gone")
                            break
                        else:
                            self.logger.info("tasks still in thawed freezer: "
                                             + str(ret['out']))
                            time.sleep(1)
                    cmd = ["rmdir", os.path.dirname(freezer_state)]
                    self.logger.info("Executing %s" % ' '.join(cmd))
                    self.du.run_cmd(hosts=host, cmd=cmd, sudo=True)

    def tearDown(self):
        # Standard PTL teardown first (deletes jobs, restores defaults)
        TestFunctional.tearDown(self)
        # cpuset MoMs manage their own cgroups; skip the mom-side checks
        mom_checks = True
        if self.moms_list[0].is_cpuset_mom():
            mom_checks = False
        self.load_default_config(mom_checks=mom_checks)
        if not self.iscray:
            self.remove_vntype()
        events = ['execjob_begin', 'execjob_launch', 'execjob_attach',
                  'execjob_epilogue', 'execjob_end', 'exechost_startup',
                  'exechost_periodic', 'execjob_resize', 'execjob_abort']
        # Disable the cgroups hook
        conf = {'enabled': 'False', 'freq': 10, 'event': events}
        self.server.manager(MGR_CMD_SET, HOOK, conf, self.hook_name)
        # Cleanup any temp file created
        self.logger.info('Deleting temporary files %s' % self.tempfile)
        self.du.rm(hostname=self.serverA, path=self.tempfile, force=True,
                   recursive=True, sudo=True)
        # Remove leftover cgroup state on every execution host
        for host in self.hosts_list:
            self.cleanup_frozen_jobs(host)
            self.cleanup_cgroup_subsys(host)
test/tests/functional/pbs_check_job_attrib.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
from tests.functional import * class TestCheckJobAttrib(TestFunctional): """ This testsuite is to validate job attributes and values """ def test_exec_vnode_after_job_rerun(self): """ Test unsetting of exec_vnode of a job which got requeued after stage-in and make sure stage-in files are cleaned up. """ hook_name = "momhook" hook_body = "import pbs\npbs.event().reject('my custom message')\n" a = {'event': 'execjob_begin', 'enabled': 'True'} self.server.create_import_hook(hook_name, a, hook_body) self.server.log_match(".*successfully sent hook file.*" + hook_name + ".PY" + ".*", regexp=True, max_attempts=100, interval=5) storage_info = {} starttime = int(time.time()) stagein_path = self.mom.create_and_format_stagein_path( storage_info, asuser=str(TEST_USER)) a = {ATTR_stagein: stagein_path} j = Job(TEST_USER, a) jid = self.server.submit(j) self.server.expect(JOB, 'exec_vnode', id=jid, op=UNSET) # make scheduling off to avoid any race conditions # otherwise scheduler tries to run job till it reached H state self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) self.server.expect(JOB, {'run_count': (GT, 0)}, id=jid) self.server.log_match('my custom message', starttime=starttime) path = stagein_path.split("@") msg = "Staged in file not cleaned" self.assertFalse(self.mom.isfile(path[0]), msg) ================================================ FILE: test/tests/functional/pbs_checkpoint.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from ptl.utils.pbs_crayutils import CrayUtils from tests.functional import * class TestCheckpoint(TestFunctional): """ This test suite targets Checkpoint functionality. 
""" abort_file = '' cu = CrayUtils() def setUp(self): TestFunctional.setUp(self) a = {'job_history_enable': 'True'} self.server.manager(MGR_CMD_SET, SERVER, a) abort_script = """#!/bin/bash kill $1 exit 0 """ self.abort_file = self.mom.add_checkpoint_abort_script( body=abort_script) self.platform = self.du.get_platform() if self.platform != 'cray' and self.platform != 'craysim': self.attrs = {ATTR_l + '.select': '1:ncpus=1', ATTR_l + '.place': 'excl'} else: nv = self.cu.num_compute_vnodes(self.server) self.assertNotEqual(nv, 0, "No cray_compute vnodes are present.") self.attrs = {ATTR_l + '.select': '%d:ncpus=1' % nv, ATTR_l + '.place': 'scatter'} def verify_checkpoint_abort(self, jid, stime): """ Verify that checkpoint and abort happened. """ self.ck_dir = os.path.join(self.mom.pbs_conf['PBS_HOME'], 'checkpoint', jid + '.CK') self.assertTrue(self.du.isdir(hostname=self.mom.hostname, path=self.ck_dir, runas=ROOT_USER), msg="Checkpoint directory %s not found" % self.ck_dir) _msg1 = "%s;req_holdjob: Checkpoint initiated." % jid self.mom.log_match(_msg1, starttime=stime) _msg2 = "%s;checkpoint_abort script %s: exit code 0" % ( jid, self.abort_file) self.mom.log_match(_msg2, starttime=stime) _msg3 = "%s;checkpointed to %s" % (jid, self.ck_dir) self.mom.log_match(_msg3, starttime=stime) _msg4 = "%s;task 00000001 terminated" % jid self.mom.log_match(_msg4, starttime=stime) def start_server_hot(self): """ Start the server with the hot option. """ pbs_exec = self.server.pbs_conf['PBS_EXEC'] svrname = self.server.pbs_server_name pbs_server_hot = [os.path.join( pbs_exec, 'sbin', 'pbs_server'), '-t', 'hot'] self.du.run_cmd(svrname, cmd=pbs_server_hot, sudo=True) self.assertTrue(self.server.isUp()) def checkpoint_abort_with_qterm_restart_hot(self, qterm_type): """ Checkpointing with qterm -t , hot server restart. 
""" j1 = Job(TEST_USER, self.attrs) j1.set_sleep_time(20) jid1 = self.server.submit(j1) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) start_time = int(time.time()) self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'}) self.server.qterm(manner=qterm_type) self.verify_checkpoint_abort(jid1, start_time) self.start_server_hot() self.assertTrue(self.server.isUp()) msg = "%s;Requeueing job, substate: 10 Requeued in queue: workq" % jid1 self.server.log_match(msg, starttime=start_time) # wait for the server to hot start the job self.server.expect(JOB, {'job_state': 'R'}, id=jid1, interval=2) self.server.expect(JOB, 'exec_vnode', id=jid1, op=SET) self.assertFalse(os.path.exists(self.ck_dir), msg=self.ck_dir + " still exists") self.server.expect(JOB, {'job_state': 'F'}, jid1, extend='x', interval=5) def test_checkpoint_abort_with_preempt(self): """ This test verifies that checkpoint_abort works as expected when a job is preempted via checkpoint. It does so by submitting a job in express queue which preempts a running job in the default queue. """ self.server.manager(MGR_CMD_SET, SCHED, {'preempt_order': 'C'}, runas=ROOT_USER) a = {'queue_type': 'execution', 'started': 'True', 'enabled': 'True', 'Priority': 200} self.server.manager(MGR_CMD_CREATE, QUEUE, a, "expressq") j1 = Job(TEST_USER, self.attrs) jid1 = self.server.submit(j1) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) self.attrs['queue'] = 'expressq' j2 = Job(TEST_USER, self.attrs) j2.set_sleep_time(20) start_time = int(time.time()) jid2 = self.server.submit(j2) self.server.expect(JOB, {'job_state': 'R'}, id=jid2) self.server.expect(JOB, {'job_state': 'Q'}, id=jid1) self.verify_checkpoint_abort(jid1, start_time) self.server.expect(JOB, {'job_state': 'F'}, jid2, extend='x', interval=5) self.server.expect(JOB, {'job_state': 'F'}, jid1, extend='x', interval=5) def test_checkpoint_abort_with_qhold(self): """ This test uses qhold for checkpointing. 
""" j1 = Job(TEST_USER, self.attrs) jid1 = self.server.submit(j1) self.server.expect(JOB, {'job_state': 'R'}, id=jid1) start_time = int(time.time()) self.server.holdjob(jid1) self.server.expect(JOB, {'job_state': 'H'}, id=jid1) self.verify_checkpoint_abort(jid1, start_time) def test_checkpoint_abort_with_qterm_immediate_restart_hot(self): """ This tests checkpointing with qterm -t immediate, hot server restart. """ self.checkpoint_abort_with_qterm_restart_hot("immediate") def test_checkpoint_abort_with_qterm_delay_restart_hot(self): """ This tests checkpointing with qterm -t delay, hot server restart. """ self.checkpoint_abort_with_qterm_restart_hot("delay") def tearDown(self): TestFunctional.tearDown(self) self.du.rm(hostname=self.mom.hostname, path=self.abort_file, sudo=True, force=True) ================================================ FILE: test/tests/functional/pbs_client_response.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. 
For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * import time class TestClientResponse(TestFunctional): """ Test cases to check number of response getting from client command in 1 second """ def test_qstat_reponse(self): """ Test to check how many qstat can be done in 1 second. """ count = 0 t = time.time() + 1 qstat_cmd = os.path.join(self.server.pbs_conf["PBS_EXEC"], "bin", "qstat") while time.time() < t: ret = self.du.run_cmd(self.server.hostname, qstat_cmd) self.assertTrue('rc', 0) count += 1 self.logger.info("Number qstat response:%d", count) ================================================ FILE: test/tests/functional/pbs_complete_running_parent_job.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
# # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * class Test_complete_running_parent_job(TestFunctional): """ This test suite is for testing the complete_running() procedure is processed for parent array job. """ def setUp(self): """ Set eligible_time_enable = True. This is due to test the issue in PP-1211 """ TestFunctional.setUp(self) self.server.manager(MGR_CMD_SET, SERVER, { 'eligible_time_enable': True}) def test_parent_job_S_accounting_record(self): """ Submit an array job and test whether the 'S' accounting record is created for parent job. """ J = Job(TEST_USER, attrs={ATTR_J: '1-2'}) J.set_sleep_time(1) parent_jid = self.server.submit(J) self.server.accounting_match(msg='.*;S;' + re.escape(parent_jid) + ".*", id=parent_jid, regexp=True) def test_parent_job_comment_and_stime(self): """ Submit an array job and test whether the comment and stime is set for parent job. 
""" J = Job(TEST_USER, attrs={ATTR_J: '1-2'}) J.set_sleep_time(10) parent_jid = self.server.submit(J) attr = { ATTR_comment: (MATCH_RE, 'Job Array Began at .*'), ATTR_stime: (MATCH_RE, '.+') } self.server.expect(JOB, attr, id=parent_jid, attrop=PTL_AND) ================================================ FILE: test/tests/functional/pbs_conf_resv_stale_vnode.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. 
# # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * class TestResvStaleVnode(TestFunctional): """ Test that the scheduler won't confirm a reservation on stale vnode and make sure reservations that have nodes that have gone stale get degreaded """ def setUp(self): TestFunctional.setUp(self) # Create 3 vnodes named different things in different vnodedef files # This allows us to delete a vnodedef file and make that node stale self.mom.add_config(conf={'$vnodedef_additive': 'False'}) a = {'resources_available.ncpus': 1, 'priority': 100} self.mom.create_vnodes(a, 1, fname='nat', restart=False, usenatvnode=True, expect=False, vname='foo') a['priority'] = 10 self.mom.create_vnodes(a, 1, fname='fname1', delall=False, restart=False, additive=True, expect=False, vname='vn') a['priority'] = 1 self.mom.create_vnodes(a, 1, fname='fname2', delall=False, additive=True, expect=False, vname='vnode') self.scheduler.set_sched_config({'node_sort_key': '\"sort_priority HIGH\"'}) def test_conf_resv_stale_vnode(self): """ Test that the scheduler won't confirm a reservation on a stale node. 
""" # Ensure the hostsets aren't used by associating a node to a queue a = {'queue_type': 'Execution', 'enabled': 'True', 'started': 'True'} self.server.manager(MGR_CMD_CREATE, QUEUE, a, id='workq2') self.server.manager(MGR_CMD_SET, NODE, {'queue': 'workq2'}, id=self.mom.shortname) # Submit a job that will run on our stale vnode a = {'Resource_List.select': '1:vnode=vn[0]', 'Resource_List.walltime': 3600} J = Job(TEST_USER, attrs=a) jid = self.server.submit(J) self.server.expect(JOB, {ATTR_state: 'R'}, id=jid) self.mom.delete_vnode_defs(vdefname='fname1') self.mom.signal('-HUP') self.server.expect(NODE, {'state': (MATCH_RE, 'Stale')}, id='vn[0]') now = int(time.time()) a = {'reserve_start': now + 5400, 'reserve_end': now + 7200} R = Reservation(TEST_USER, a) rid = self.server.submit(R) # Reservation should be confirmed on vnode[0] since vn[0] is Stale a = {'resv_nodes': '(vnode[0]:ncpus=1)'} a2 = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')} self.server.expect(RESV, a, id=rid) self.server.expect(RESV, a2, id=rid) def test_stale_degraded(self): """ Test that a reservation goes into the degraded state when one of its vnodes go stale """ self.server.expect(NODE, {'state=free': 3}) now = int(time.time()) a = {'Resource_List.select': '3:ncpus=1', 'Resource_List.place': 'vscatter', 'reserve_start': now + 3600, 'reserve_end': now + 7200} R = Reservation(TEST_USER, attrs=a) rid = self.server.submit(R) a = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')} self.server.expect(RESV, a, id=rid) self.mom.delete_vnode_defs(vdefname='fname1') self.mom.signal('-HUP') self.server.expect(NODE, {'state': (MATCH_RE, 'Stale')}, id='vn[0]') a = {'reserve_state': (MATCH_RE, 'RESV_DEGRADED|10')} self.server.expect(RESV, a, id=rid) ================================================ FILE: test/tests/functional/pbs_config.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. 
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.
import tarfile from tests.functional import * class TestPBSConfig(TestFunctional): """ Test cases for pbs_config tool """ snapdirs = [] snaptars = [] def test_config_for_snapshot(self): """ Test pbs_config's --snap option """ pbs_snapshot_path = os.path.join( self.server.pbs_conf["PBS_EXEC"], "sbin", "pbs_snapshot") if not os.path.isfile(pbs_snapshot_path): self.skipTest("pbs_snapshot not found") pbs_config_path = os.path.join( self.server.pbs_conf["PBS_EXEC"], "unsupported", "pbs_config") if not os.path.isfile(pbs_config_path): self.skipTest("pbs_config not found") # Create 4 vnodes a = {ATTR_rescavail + ".ncpus": 2} self.mom.create_vnodes(attrib=a, num=4, usenatvnode=True) self.server.expect(VNODE, {'state=free': 4}, count=True) # Create a queue a = {'queue_type': 'execution', 'started': 'True', 'enabled': 'True', 'Priority': 200} self.server.manager(MGR_CMD_CREATE, QUEUE, a, id="expressq") # Set preempt_order to 'R' a = {"preempt_order": "R"} self.server.manager(MGR_CMD_SET, SCHED, a, id="default") # Set sched_config 'smp_cluster_dist' to 'round_robin' self.scheds["default"].set_sched_config( {"smp_cluster_dist": "round_robin"}) # Now that we have a custom configuration, take a snapshot outdir = pwd.getpwnam(self.du.get_current_user()).pw_dir snap_cmd = [pbs_snapshot_path, "-o " + outdir, "--with-sudo"] ret = self.du.run_cmd(cmd=snap_cmd, logerr=False, as_script=True) self.assertEqual(ret["rc"], 0, "pbs_snapshot command failed") snap_out = ret['out'][0] output_tar = snap_out.split(":")[1] output_tar = output_tar.strip() # Check that the output tarball was created self.assertTrue(os.path.isfile(output_tar), "Error capturing snapshot:\n" + str(ret)) self.snaptars.append(output_tar) # Unwrap the tarball tar = tarfile.open(output_tar) tar.extractall(path=outdir) tar.close() # snapshot directory name = .tgz[:-4] snap_dir = output_tar[:-4] self.assertTrue(os.path.isdir(snap_dir)) self.snapdirs.append(snap_dir) # Let's revert the system back to default now 
TestFunctional.setUp(self) # Now, use pbs_config --snap to build the system captured # previously in the snapshot config_cmd = [pbs_config_path, "--snap=" + snap_dir] self.du.run_cmd(cmd=config_cmd, sudo=True, logerr=False) # Verify that there are 4 vnodes, expressq, preempt_order=R and # smp_cluster_dist=round_robin self.server.expect(VNODE, {'state=free': 4}, count=True) self.server.expect(QUEUE, {"Priority": 200}, id="expressq") self.server.expect(SCHED, {"preempt_order": "R"}, id="default") self.scheds["default"].parse_sched_config() self.assertEqual( self.scheds["default"].sched_config["smp_cluster_dist"], "round_robin", "pbs_config didn't load sched_config correctly") def tearDown(self): # Cleanup snapshot dirs and tars for snap_dir in self.snapdirs: self.du.rm(path=snap_dir, recursive=True, force=True) for snap_tar in self.snaptars: self.du.rm(path=snap_tar, force=True) ================================================ FILE: test/tests/functional/pbs_cpuset.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . 
# # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * @requirements(num_moms=2) class TestPbsCpuset(TestFunctional): """ This testsuite covers various features using cgroup cpuset systems - Reliable Job Startup Feature - Node Rampdown Feature """ def check_stageout_file_size(self): """ This function will check that at least 1gb of test.img file which is to be stagedout is created within 10 seconds. 
""" fpath = os.path.join(TEST_USER.home, "test.img") cmd = ['stat', '-c', '%s', fpath] fsize = 0 for i in range(11): rc = self.du.run_cmd(hosts=self.h0, cmd=cmd, runas=TEST_USER) if rc['rc'] == 0 and len(rc['out']) == 1: try: fsize = int(rc['out'][0]) except Exception: pass # 1073741824 == 1Gb if fsize > 1073741824: break else: time.sleep(1) if fsize <= 1073741824: self.fail("Failed to create 1gb file at %s" % fpath) def setUp(self): TestFunctional.setUp(self) # skip if there are no cpuset systems in the test cluster no_csetmom = True for mom in self.moms.values(): if mom.is_cpuset_mom(): no_csetmom = False if no_csetmom: self.skipTest("Skip on cluster without cgroup cpuset system.") # Various host names self.h0 = self.moms.values()[0].shortname self.h1 = self.moms.values()[1].shortname self.hostA = socket.getfqdn(self.h0) self.hostB = socket.getfqdn(self.h1) # Various node names. First mom may or may not be a cpuset system. try: self.n0 = self.server.status( NODE, id='%s[0]' % (self.h0))[0]['id'] except PbsStatusError: self.n0 = self.h0 self.n1 = self.h1 self.n2 = '%s[0]' % (self.n1) self.n3 = '%s[1]' % (self.n1) # Skip if there are less than four vnodes. 
There should be # three from cpuset system (natural + two NUMA vnodes) nodeinfo = self.server.status(NODE) if len(nodeinfo) < 4: self.skipTest("Not enough vnodes to run the test.") # skip if second mom has less than two NUMA vnodes try: self.server.status(NODE, id=self.n3) except PbsStatusError: self.skipTest("vnode %s doesn't exist on pbs server" % (self.n3)) # skip if vnodes are not in free state for node in nodeinfo: if node['state'] != 'free': self.skipTest("Not all the vnodes are in free state") self.pbs_release_nodes_cmd = os.path.join( self.server.pbs_conf['PBS_EXEC'], 'bin', 'pbs_release_nodes') # number of resource ncpus to request initially ncpus = self.server.status(NODE, 'resources_available.ncpus', id=self.n3)[0] # request a partial amount of ncpus in self.n3 self.ncpus2 = int(ncpus['resources_available.ncpus']) / 2 # cgroup cpuset path on second node cmd = ['grep cgroup', '/proc/mounts', '|', 'grep cpuset', '|', 'grep -v', '/dev/cpuset'] ret = self.server.du.run_cmd(self.n1, cmd, runas=TEST_USER) self.cset_path = ret['out'][0].split()[1] # launch hook self.launch_hook_body = """ import pbs import time e=pbs.event() pbs.logmsg(pbs.LOG_DEBUG, "Executing launch") # print out the vnode_list[] values for vn in e.vnode_list: v = e.vnode_list[vn] pbs.logjobmsg(e.job.id, "launch: found vnode_list[" + v.name + "]") # print out the vnode_list_fail[] values: for vn in e.vnode_list_fail: v = e.vnode_list_fail[vn] pbs.logjobmsg(e.job.id, "launch: found vnode_list_fail[" + v.name + "]") if e.job.in_ms_mom(): pj = e.job.release_nodes(keep_select="ncpus=1:mem=1gb") if pj is None: e.job.Hold_Types = pbs.hold_types("s") e.job.rerun() e.reject("unsuccessful at LAUNCH") pbs.logmsg(pbs.LOG_DEBUG, "Sleeping for 20sec") time.sleep(20) """ self.script = {} self.job1_select = "ncpus=1:mem=1gb+" + \ "ncpus=%d:mem=1gb:vnode=%s+" % (self.ncpus2, self.n2) + \ "ncpus=%d:mem=1gb:vnode=%s" % (self.ncpus2, self.n3) self.job1_place = "vscatter" # expected values upon successful job 
submission self.job1_schedselect = "1:ncpus=1:mem=1gb+" + \ "1:ncpus=%d:mem=1gb:vnode=%s+" % (self.ncpus2, self.n2) + \ "1:ncpus=%d:mem=1gb:vnode=%s" % (self.ncpus2, self.n3) self.job1_exec_host = "%s/0+%s/0*%d+%s/1*%d" % ( self.h0, self.h1, self.ncpus2, self.n1, self.ncpus2) self.job1_exec_vnode = "(%s:ncpus=1:mem=1048576kb)+" % (self.n0,) + \ "(%s:ncpus=%d:mem=1048576kb)+" % (self.n2, self.ncpus2) + \ "(%s:ncpus=%d:mem=1048576kb)" % (self.n3, self.ncpus2) # expected values after release of vnode of self.n3 self.job1_schedsel1 = "1:ncpus=1:mem=1048576kb+" + \ "1:ncpus=%d:mem=1048576kb:vnode=%s" % (self.ncpus2, self.n2) self.job1_exec_host1 = "%s/0+%s/0*%d" % (self.h0, self.h1, self.ncpus2) self.job1_exec_vnode1 = "(%s:ncpus=1:mem=1048576kb)+" % (self.n0,) + \ "(%s:ncpus=%d:mem=1048576kb)" % (self.n2, self.ncpus2) # expected values during lengthy stageout self.job1_newsel = "1:ncpus=1:mem=1048576kb" self.job1_new_exec_host = "%s/0" % self.h0 self.job1_new_exec_vnode = "(%s:ncpus=1:mem=1048576kb)" % self.n0 # values to use when matching accounting logs self.job1_exec_host_esc = self.job1_exec_host.replace( "*", r"\*").replace("[", r"\[").replace("]", r"\]").replace( "+", r"\+") self.job1_exec_vnode_esc = self.job1_exec_vnode.replace( "[", r"\[").replace("]", r"\]").replace("(", r"\(").replace( ")", r"\)").replace("+", r"\+") self.job1_sel_esc = self.job1_select.replace( "[", r"\[").replace("]", r"\]").replace("(", r"\(").replace( ")", r"\)").replace("+", r"\+") self.job1_new_exec_vnode_esc = self.job1_new_exec_vnode.replace( "[", r"\[").replace("]", r"\]").replace("(", r"\(").replace( ")", r"\)").replace("+", r"\+") def tearDown(self): for host in [self.h0, self.h1]: test_img = os.path.join("/home", "pbsuser", "test.img") self.du.rm(hostname=host, path=test_img, force=True, runas=TEST_USER) TestFunctional.tearDown(self) def test_reliable_job_startup_on_cpuset(self): """ A job is started with two numa nodes and goes in R state. 
        An execjob_launch hook will force job to have only one numa node.
        The released numa node can be used in another job.
        """
        # instantiate execjob_launch hook
        hook_event = "execjob_launch"
        hook_name = "launch"
        a = {'event': hook_event, 'enabled': 'true'}
        stime = time.time()
        self.server.create_import_hook(hook_name, a, self.launch_hook_body)
        # Check mom logs that the launch hook got propagated
        msg = "Hook;launch.PY;copy hook-related file request received"
        self.moms.values()[1].log_match(msg, starttime=stime)
        # Submit job1 that uses second mom's two NUMA nodes, in R state
        a = {ATTR_l + '.select': self.job1_select,
             ATTR_l + '.place': self.job1_place,
             ATTR_W: 'tolerate_node_failures=job_start'}
        j = Job(TEST_USER, attrs=a)
        stime = time.time()
        jid = self.server.submit(j)
        # Check the exec_vnode while in substate 41
        self.server.expect(JOB, {ATTR_substate: '41'}, id=jid)
        self.server.expect(JOB, 'exec_vnode', id=jid, op=SET)
        job_stat = self.server.status(JOB, id=jid)
        execvnode1 = job_stat[0]['exec_vnode']
        self.logger.info("initial exec_vnode: %s" % execvnode1)
        initial_vnodes = execvnode1.split('+')
        # Check the exec_vnode after job is in substate 42
        self.server.expect(JOB, {ATTR_substate: '42'}, offset=20, id=jid)
        self.server.expect(JOB, 'exec_vnode', id=jid, op=SET)
        job_stat = self.server.status(JOB, id=jid)
        execvnode2 = job_stat[0]['exec_vnode']
        self.logger.info("pruned exec_vnode: %s" % execvnode2)
        # Check mom logs for pruned from and pruned to messages
        self.moms.values()[0].log_match("Job;%s;pruned from exec_vnode=%s" % (
            jid, execvnode1), starttime=stime)
        self.moms.values()[0].log_match("Job;%s;pruned to exec_vnode=%s" % (
            jid, execvnode2), starttime=stime)
        # Find out the released vnode: the launch hook pruned the job to a
        # single vnode (execvnode2); whichever initial chunk is not that
        # vnode is the one that was released.
        if initial_vnodes[0] == execvnode2:
            execvnodeB = initial_vnodes[1]
        else:
            execvnodeB = initial_vnodes[0]
        vnodeB = execvnodeB.split(':')[0].split('(')[1]
        self.logger.info("released vnode: %s" % vnodeB)
        # Submit job2 requesting all of the released vnode's cpus, job runs
        a = {ATTR_l + '.select':
             '1:ncpus=%d:mem=1gb:vnode=%s' % (self.ncpus2 * 2, vnodeB)}
        j2 = Job(TEST_USER, attrs=a)
        stime = time.time()
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {ATTR_state: 'R'}, offset=20, id=jid2)
        # Check if vnode for job2 matches released vnode from job1
        self.server.expect(JOB, 'exec_vnode', id=jid2, op=SET)
        job_stat = self.server.status(JOB, id=jid2)
        execvnode3 = job_stat[0]['exec_vnode']
        vnode3 = execvnode3.split(':')[0].split('(')[1]
        self.assertEqual(vnode3, vnodeB)
        self.logger.info("job2 vnode %s is the released vnode %s" % (
            vnode3, vnodeB))

    def test_release_nodes_on_cpuset_sis(self):
        """
        On a cluster where the second mom is a cgroup cpuset system with
        two NUMA nodes, submit a job that will use cpus on both NUMA
        vnodes. The job goes in R state. Use pbs_release_nodes to
        successfully release one of the NUMA vnodes and its resources
        used in the job. Compare the job's cgroup cpuset info before and
        after calling pbs_release_nodes to verify that NUMA node's cpu
        resources were released.
        """
        # Submit a job that uses second mom's two NUMA nodes, in R state
        a = {ATTR_l + '.select': self.job1_select,
             ATTR_l + '.place': self.job1_place}
        j1 = Job(TEST_USER, attrs=a)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R',
                                 'Resource_List.mem': '3gb',
                                 'Resource_List.ncpus': 1 + self.ncpus2 * 2,
                                 'Resource_List.nodect': 3,
                                 'schedselect': self.job1_schedselect,
                                 'exec_host': self.job1_exec_host,
                                 'exec_vnode': self.job1_exec_vnode},
                           id=jid1)
        # Check the cpuset before releasing self.n3 from jid1
        cset_file = os.path.join(self.cset_path, 'pbs_jobs.service/jobid',
                                 jid1, 'cpuset.cpus')
        cset_before = self.du.cat(self.n1, cset_file)
        cset_j1_before = cset_before['out']
        self.logger.info("cset_j1_before : %s" % cset_j1_before)
        before_release = time.time()
        # Release a NUMA vnode on second mom using command pbs_release_nodes
        cmd = [self.pbs_release_nodes_cmd, '-j', jid1, self.n3]
        ret = self.server.du.run_cmd(self.server.hostname, cmd,
                                     runas=TEST_USER)
        self.assertEqual(ret['rc'], 0)
        self.server.expect(JOB, {'job_state': 'R',
                                 'Resource_List.ncpus': 1 + self.ncpus2,
                                 'Resource_List.nodect': 2,
                                 'schedselect': self.job1_schedsel1,
                                 'exec_host': self.job1_exec_host1,
                                 'exec_vnode': self.job1_exec_vnode1},
                           id=jid1)
        # Check if sister mom updated its internal nodes table after release
        self.moms.values()[1].log_match('Job;%s;updated nodes info' % jid1,
                                        starttime=before_release - 1)
        # Check the cpuset for the job after releasing self.n3
        cset_after = self.du.cat(self.n1, cset_file)
        cset_j1_after = cset_after['out']
        self.logger.info("cset_j1_after : %s" % cset_j1_after)
        # Compare the before and after cpusets info; they must differ since
        # the released NUMA node's cpus should be gone from the job's cpuset.
        msg = "%s: cpuset cpus remain after release of %s" % (jid1, self.n3)
        self.assertNotEqual(cset_j1_before, cset_j1_after, msg)

    def test_release_nodes_on_stageout_cset(self):
        """
        Submit a job, with -W release_nodes_on_stageout=true as a PBS
        directive in the job script, that will use cpus and mem on two
        NUMA vnodes on the second mom. The job goes in R state.
        The job creates a huge stageout file. When the job is deleted
        the sister NUMA vnodes are released during lengthy stageout and
        only the primary execution host's vnode is left assigned to the
        job.
        """
        # Shell command strings that run fib() via pbs_python; FIB400 runs
        # long enough to keep the job alive during stageout.
        FIB40 = os.path.join(self.server.pbs_conf['PBS_EXEC'], 'bin', '') + \
            'pbs_python -c "exec(\\\"def fib(i):\\n if i < 2:\\n \
return i\\n return fib(i-1) + fib(i-2)\\n\\nprint(fib(40))\\\")"'
        FIB400 = os.path.join(self.server.pbs_conf['PBS_EXEC'], 'bin', '') + \
            'pbs_python -c "exec(\\\"def fib(i):\\n if i < 2:\\n \
return i\\n return fib(i-1) + fib(i-2)\\n\\nprint(fib(400))\\\")"'
        self.script['job1'] = \
            "#PBS -S /bin/bash\n" \
            "#PBS -l select=" + self.job1_select + "\n" + \
            "#PBS -l place=" + self.job1_place + "\n" + \
            "#PBS -W stageout=test.img@%s:test.img\n" % (self.n1,) + \
            "#PBS -W release_nodes_on_stageout=true\n" + \
            "dd if=/dev/zero of=test.img count=1024 bs=2097152\n" + \
            "pbsdsh -n 1 -- %s\n" % (FIB40,) + \
            "pbsdsh -n 2 -- %s\n" % (FIB40,) + \
            "%s\n" % (FIB400,)
        stime = time.time()
        j = Job(TEST_USER)
        j.create_script(self.script['job1'])
        jid = self.server.submit(j)
        self.server.expect(JOB, {'job_state': 'R',
                                 'release_nodes_on_stageout': 'True',
                                 'Resource_List.mem': '3gb',
                                 'Resource_List.ncpus': 1 + self.ncpus2 * 2,
                                 'Resource_List.nodect': 3,
                                 'Resource_List.select': self.job1_select,
                                 'Resource_List.place': self.job1_place,
                                 'schedselect': self.job1_schedselect,
                                 'exec_host': self.job1_exec_host,
                                 'exec_vnode': self.job1_exec_vnode},
                           id=jid)
        # Check various vnode status.
        attr0 = {'state': 'job-busy', 'jobs': jid + '/0',
                 'resources_assigned.ncpus': 1,
                 'resources_assigned.mem': '1048576kb'}
        self.server.expect(VNODE, attr0, id=self.n0)
        # NOTE(review): ncpus is compared as int 0 here but as str '0' in the
        # post-delete check below — confirm both comparisons behave the same.
        attr1 = {'state': 'free', 'resources_assigned.ncpus': 0,
                 'resources_assigned.mem': '0kb'}
        self.server.expect(VNODE, attr1, id=self.n1)
        jobs = ''
        for i in range(0, int(self.ncpus2)):
            jobs += ' %s/%d,' % (jid, i)
        jobs = jobs.strip().strip(',')
        attr2 = {'state': 'free', 'jobs': jobs,
                 'resources_assigned.ncpus': int(self.ncpus2),
                 'resources_assigned.mem': '1048576kb'}
        for vn in [self.n2, self.n3]:
            self.server.expect(VNODE, attr2, id=vn)
        # job's PBS_NODEFILE contents should match exec_host
        pbs_nodefile = os.path.join(self.server.
                                    pbs_conf['PBS_HOME'], 'aux', jid)
        cmd = ['cat', pbs_nodefile]
        ret = self.server.du.run_cmd(self.h0, cmd, sudo=False)
        # NOTE(review): due to operator precedence this asserts
        # bool(self.hostA) and (self.hostB in ret['out']); it does NOT check
        # that hostA is in the nodefile. Likely intended:
        # self.hostA in ret['out'] and self.hostB in ret['out'].
        self.assertTrue(self.hostA and self.hostB in ret['out'])
        # The job will write out enough file size to have a lengthy stageout
        self.check_stageout_file_size()
        # Deleting the job will trigger the stageout process
        # at which time the sister node is automatically released
        # due to release_nodes_stageout=true set
        self.server.delete(jid)
        # Verify remaining job resources.
        self.server.expect(JOB, {'job_state': 'E',
                                 'Resource_List.mem': '1gb',
                                 'Resource_List.ncpus': 1,
                                 'Resource_List.select': self.job1_newsel,
                                 'Resource_List.place': self.job1_place,
                                 'Resource_List.nodect': 1,
                                 'schedselect': self.job1_newsel,
                                 'exec_host': self.job1_new_exec_host,
                                 'exec_vnode': self.job1_new_exec_vnode},
                           id=jid)
        # Check various vnode status
        attr0 = {'state': 'job-busy', 'jobs': jid + '/0',
                 'resources_assigned.ncpus': 1,
                 'resources_assigned.mem': '1048576kb'}
        self.server.expect(VNODE, attr0, id=self.n0)
        attr1 = {'state': 'free', 'resources_assigned.ncpus': '0',
                 'resources_assigned.mem': '0kb'}
        for vn in [self.n1, self.n2, self.n3]:
            self.server.expect(VNODE, attr1, id=vn)
        # job's PBS_NODEFILE contents should match exec_host
        ret = self.server.du.run_cmd(self.h0, cmd, sudo=False)
        self.assertTrue(self.hostA in ret['out'])
        self.assertFalse(self.hostB in ret['out'])
        # Verify mom_logs
        self.moms.values()[0].log_match(
            "Job;%s;%s.+cput=.+ mem=.+" % (jid, self.n1), n=10,
            regexp=True)
        self.moms.values()[1].log_match(
            "Job;%s;DELETE_JOB2 received" % (jid,), n=20)
        # Check account update ('u') record
        msg0 = ".*%s;%s.*exec_host=%s" % ('u', jid, self.job1_exec_host_esc)
        msg1 = ".*exec_vnode=%s" % self.job1_exec_vnode_esc
        msg2 = r".*Resource_List\.mem=%s" % '3gb'
        msg3 = r".*Resource_List\.ncpus=%d" % 9
        msg4 = r".*Resource_List\.place=%s" % self.job1_place
        msg5 = r".*Resource_List\.select=%s.*" % self.job1_sel_esc
        msg = msg0 + msg1 + msg2 + msg3 + msg4 + msg5
        self.server.accounting_match(msg=msg, regexp=True, n="ALL",
                                     starttime=stime)
        # Check to make sure 'c' (next) record got generated
        msg0 = ".*%s;%s.*exec_host=%s" % ('c', jid, self.job1_new_exec_host)
        msg1 = ".*exec_vnode=%s" % self.job1_new_exec_vnode_esc
        msg2 = r".*Resource_List\.mem=%s" % '1048576kb'
        msg3 = r".*Resource_List\.ncpus=%d" % 1
        msg4 = r".*Resource_List\.place=%s" % self.job1_place
        msg5 = r".*Resource_List\.select=%s.*" % self.job1_newsel
        msg = msg0 + msg1 + msg2 + msg3 + msg4 + msg5
self.server.accounting_match(msg=msg, regexp=True, n="ALL", starttime=stime) ================================================ FILE: test/tests/functional/pbs_cray_check_node_exclusivity.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
from tests.functional import *


@tags('cray', 'reservation')
class TestCheckNodeExclusivity(TestFunctional):
    """
    Test suite for reservation.
    This test Suite checks the exclusivity of node when a reservation
    asks for it.
    Adapted for Cray Configuration
    """
    # Cached attributes of the first cray_compute vnode found; populated by
    # get_vnode_ncpus_value().  Note: values come straight from status() and
    # are therefore strings, not ints.
    ncpus = None
    vnode = None

    def setUp(self):
        # These tests only make sense on a Cray platform.
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("Test suite only meant to run on a Cray")
        self.script = []
        self.script += ['echo Hello World\n']
        self.script += ['aprun -b -B /bin/sleep 10']
        TestFunctional.setUp(self)

    def submit_and_confirm_resv(self, a=None, index=None):
        """
        This is common function to submit reservation and
        verify reservation confirmed
        """
        r = Reservation(TEST_USER, attrs=a)
        rid = self.server.submit(r)
        a = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')}
        if index is not None:
            a['reserve_index'] = index
        self.server.expect(RESV, a, id=rid)
        return rid

    def get_vnode_ncpus_value(self):
        # Record ncpus and vnode name of the first cray_compute vnode found.
        all_nodes = self.server.status(NODE)
        for n in all_nodes:
            if n['resources_available.vntype'] == 'cray_compute':
                self.ncpus = n['resources_available.ncpus']
                self.vnode = n['resources_available.vnode']
                break

    def test_node_state_with_adavance_resv(self):
        """
        Test node state will change when reservation asks for
        exclusivity.
        """
        # Submit a reservation with place=excl
        start_time = time.time()
        now = int(start_time)
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_compute',
             'Resource_List.place': 'excl',
             'reserve_start': now + 30,
             'reserve_end': now + 60}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        # Node must still be free after a server restart, while the
        # reservation has not yet started.
        self.server.restart()
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        self.logger.info('Waiting 20s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=20)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Wait for reservation to delete from server
        msg = "Que;" + rid_q + ";deleted at request of pbs_server@"
        self.server.log_match(msg, starttime=start_time, interval=10)
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)

    def test_node_state_with_standing_resv(self):
        """
        Test node state will change when reservation asks for
        exclusivity.
        """
        if 'PBS_TZID' in self.conf:
            tzone = self.conf['PBS_TZID']
        elif 'PBS_TZID' in os.environ:
            tzone = os.environ['PBS_TZID']
        else:
            self.logger.info('Missing timezone, using America/Los_Angeles')
            tzone = 'America/Los_Angeles'
        # Submit a standing reservation to occur every other minute for a
        # total count of 2
        start = time.time() + 20
        now = start + 20
        start = int(start)
        end = int(now)
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_compute',
             'Resource_List.place': 'excl',
             ATTR_resv_rrule: 'FREQ=MINUTELY;COUNT=2',
             ATTR_resv_timezone: tzone,
             'reserve_start': start,
             'reserve_end': end,
             }
        rid = self.submit_and_confirm_resv(a, 1)
        rid_q = rid.split(".")[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5"),
             'reserve_index': 1}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Wait for standing reservation first instance to finish
        self.logger.info(
            'Waiting 20 sec for second instance of reservation to start')
        exp_attr = {'reserve_state': (MATCH_RE, "RESV_CONFIRMED|2"),
                    'reserve_index': 2}
        self.server.expect(RESV, exp_attr, id=rid, offset=20)
        # Node state of the nodes in resv_nodes should be free
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        # Wait for standing reservation second instance to start
        self.logger.info(
            'Waiting 40 sec for second instance of reservation to start')
        exp_attr = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5"),
                    'reserve_index': 2}
        self.server.expect(RESV, exp_attr, id=rid, offset=40, interval=1)
        # check the node state of the nodes in resv_nodes
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Wait for reservations to be finished
        msg = "Que;" + rid_q + ";deleted at request of pbs_server@"
        self.server.log_match(msg, starttime=now,
                              interval=2)
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)

    def test_job_outside_resv_not_allowed(self):
        """
        Test Job outside the reservation will not be allowed to run
        if reservation has place=excl.
        """
        # Submit a reservation with place=excl
        start_time = time.time()
        now = int(start_time)
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_compute',
             'Resource_List.place': 'excl',
             'reserve_start': now + 20,
             'reserve_end': now + 30}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        self.logger.info('Waiting 20s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=20)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Submit a job outside the reservation requesting resv_nodes
        submit_dir = self.du.create_temp_dir(asuser=TEST_USER)
        a = {ATTR_q: 'workq', ATTR_l + '.select': '1:vnode=%s' % resv_node}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1, submit_dir=submit_dir)
        comment = 'Not Running: Insufficient amount of resource: vnode'
        self.server.expect(
            JOB, {'job_state': 'Q', 'comment': comment}, id=jid1)
        # Wait for reservation to end and verify node state
        # changed as job-exclusive
        msg = "Que;" + rid_q + ";deleted at request of pbs_server@"
        self.server.log_match(msg, starttime=start_time, interval=2)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive'}, id=resv_node)

    def test_conflict_reservation_on_resv_exclusive_node(self):
        """
        Test no other reservation will get confirmed (in the duration)
        when a node has a exclusive reservation confirmed on it.
        Reservation2 is inside the duration of confirmed reservation
        requesting the same vnode in Reservation1.
        """
        # Submit a reservation with place=excl
        start_time = time.time()
        now = int(start_time)
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_compute',
             'Resource_List.place': 'excl',
             'reserve_start': now + 20,
             'reserve_end': now + 60}
        rid = self.submit_and_confirm_resv(a)
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.logger.info('Waiting 20s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=20)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Submit another reservation requesting on vnode in resv_node
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % resv_node,
             'reserve_start': now + 25,
             'reserve_end': now + 30}
        r = Reservation(TEST_USER, attrs=a)
        rid2 = self.server.submit(r)
        # The overlapping reservation must be denied and deleted.
        msg = "Resv;" + rid2 + ";Reservation denied"
        self.server.log_match(msg, starttime=start_time, interval=2)
        msg2 = "Resv;" + rid2 + ";reservation deleted"
        self.server.log_match(msg2, starttime=now, interval=2)
        msg3 = "Resv;" + rid2 + ";PBS Failed to confirm resv: Insufficient "
        msg3 += "amount of resource: vnode"
        self.scheduler.log_match(msg3, starttime=now, interval=2)

    def test_node_exclusivity_with_multinode_reservation(self):
        """
        Test Jobs run correctly in multinode reservation
        and accordingly update node exclusivity.
        """
        self.get_vnode_ncpus_value()
        # Submit a reservation with place=excl
        now = int(time.time())
        a = {ATTR_l + '.select': '2:ncpus=%d' % (int(self.ncpus)),
             'Resource_List.place': 'excl',
             'reserve_start': now + 10,
             'reserve_end': now + 1600}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split(".")[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'},
                           id=resv_node[0])
        self.server.expect(NODE, {'state': 'resv-exclusive'},
                           id=resv_node[1])
        # Submit a job inside the reservation
        submit_dir = self.du.create_temp_dir(asuser=TEST_USER)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '1:ncpus=1',
             'Resource_List.place': 'shared'}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1, submit_dir=submit_dir)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node[0])
        # Submit another job inside the reservation
        submit_dir = self.du.create_temp_dir(asuser=TEST_USER)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '2:ncpus=1',
             'Resource_List.place': 'shared'}
        j2 = Job(TEST_USER, attrs=a)
        j2.create_script(self.script)
        jid2 = self.server.submit(j2, submit_dir=submit_dir)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node[0])

    def test_multiple_reservation_request_exclusive_placement(self):
        """
        Test Multiple reservations requesting exclusive placement
        are confirmed when not overlapping in time.
        """
        self.get_vnode_ncpus_value()
        # Submit a reservation with place=excl
        now = int(time.time())
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % self.vnode,
             'Resource_List.place': 'excl',
             'reserve_start': now + 10,
             'reserve_duration': 3600}
        rid = self.submit_and_confirm_resv(a)
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        # Submit a non-overlapping reservation requesting place=excl
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % resv_node,
             'Resource_List.place': 'excl',
             'reserve_start': now + 7200,
             'reserve_duration': 3600}
        self.submit_and_confirm_resv(a)

    def test_delete_future_resv_not_effect_node_state(self):
        """
        Test (Advance Reservation)Multiple reservations requesting
        exclusive placement are confirmed when not overlapping.
        Deleting the latter reservation after earlier one starts
        running leaves node in state resv-exclusive.
        """
        self.get_vnode_ncpus_value()
        # Submit a reservation with place=excl
        now = int(time.time())
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % self.vnode,
             'Resource_List.place': 'excl',
             'reserve_start': now + 10,
             'reserve_duration': 3600}
        rid = self.submit_and_confirm_resv(a)
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        # Submit a non-overlapping reservation requesting place=excl
        # on vnode in resv_node
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % resv_node,
             'Resource_List.place': 'excl',
             'reserve_start': now + 7200,
             'reserve_duration': 3600}
        rid2 = self.submit_and_confirm_resv(a)
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Delete future reservation rid2 and verify that resv node
        # is still in state resv-exclusive
        self.server.delete(rid2)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)

    def test_delete_future_standing_resv_not_effect_node_state(self):
        """
        Test (Standing Reservation)Multiple reservations requesting
        exclusive placement are confirmed when not overlapping.
        Deleting the latter reservation after earlier one starts
        running leaves node in state resv-exclusive.
        """
        self.get_vnode_ncpus_value()
        if 'PBS_TZID' in self.conf:
            tzone = self.conf['PBS_TZID']
        elif 'PBS_TZID' in os.environ:
            tzone = os.environ['PBS_TZID']
        else:
            self.logger.info('Missing timezone, using America/Los_Angeles')
            tzone = 'America/Los_Angeles'
        # Submit a standing reservation with place=excl
        now = int(time.time())
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % self.vnode,
             'Resource_List.place': 'excl',
             ATTR_resv_rrule: 'FREQ=HOURLY;COUNT=2',
             ATTR_resv_timezone: tzone,
             'reserve_start': now + 10,
             'reserve_end': now + 3100}
        rid = self.submit_and_confirm_resv(a)
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        # Submit a non-overlapping reservation requesting place=excl
        # on vnode in resv_node
        a = {ATTR_l + '.select': '1:ncpus=1:vnode=%s' % resv_node,
             'Resource_List.place': 'excl',
             ATTR_resv_rrule: 'FREQ=HOURLY;COUNT=2',
             ATTR_resv_timezone: tzone,
             'reserve_start': now + 7200,
             'reserve_end': now + 10800}
        rid2 = self.submit_and_confirm_resv(a)
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Delete future reservation rid2 and verify that resv node
        # is still in state resv-exclusive
        self.server.delete(rid2)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)

    def test_job_inside_exclusive_reservation(self):
        """
        Test Job will run correctly inside the exclusive reservation
        """
        # Script without aprun, suitable for a cray_login node.
        self.script2 = []
        self.script2 += ['echo Hello World\n']
        self.script2 += ['/bin/sleep 10']
        # Submit a reservation with place=excl
        start_time = time.time()
        now = int(start_time)
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_login',
             'Resource_List.place': 'excl',
             'reserve_start': now + 20,
             'reserve_end': now + 40}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        self.logger.info('Waiting 20s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=20)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Submit a job inside the reservation
        submit_dir = self.du.create_temp_dir(asuser=TEST_USER)
        a = {ATTR_q: rid_q,
             ATTR_l + '.select': '1:ncpus=1:vntype=cray_login',
             'Resource_List.place': 'excl'}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script2)
        jid1 = self.server.submit(j1, submit_dir=submit_dir)
        self.server.expect(
            JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node)
        # wait 5 sec for job to end
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node,
                           offset=5, interval=10)
        # Wait for reservation to end and verify node state
        # changed as free
        msg = "Que;" + rid_q + ";deleted at request of pbs_server@"
        self.server.log_match(msg, starttime=start_time, interval=2)
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        # Test Job will run correctly inside the exclusive
        # standing reservation requesting compute_node
        if 'PBS_TZID' in self.conf:
            tzone = self.conf['PBS_TZID']
        elif 'PBS_TZID' in os.environ:
            tzone = os.environ['PBS_TZID']
        else:
            self.logger.info('Missing timezone, using America/Los_Angeles')
            tzone = 'America/Los_Angeles'
        # Submit a standing reservation with place=excl
        now = int(time.time())
        a = {ATTR_l + '.select': '1:ncpus=1:vntype=cray_compute',
             'Resource_List.place': 'excl',
             ATTR_resv_rrule: 'FREQ=HOURLY;COUNT=1',
             ATTR_resv_timezone: tzone,
             'reserve_start': now + 10,
             'reserve_end': now + 300}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.server.expect(NODE, {'state': 'free'}, id=resv_node)
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        # Submit a job inside the reservation
        submit_dir = self.du.create_temp_dir(asuser=TEST_USER)
        a = {ATTR_q: rid_q}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1, submit_dir=submit_dir)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node)
        # wait 5 sec for job to end
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node,
                           offset=5, interval=10)

    def test_reservation_request_node_ignore_excl(self):
        """
        Test Reservation asking for place=excl will not get confirmed
        if node has ignore_excl set on it.
        """
        a = {'sharing': 'ignore_excl'}
        self.mom.create_vnodes(a, 1, createnode=False, delall=False,
                               usenatvnode=True)
        self.server.expect(NODE, {'state': 'free',
                                  'sharing': 'ignore_excl'},
                           id=self.mom.shortname)
        # Submit a reservation
        now = int(time.time())
        a = {'Resource_List.select': '1:ncpus=1:vntype=cray_login',
             'Resource_List.place': 'excl',
             'reserve_start': now + 20,
             'reserve_end': now + 40}
        rid = self.submit_and_confirm_resv(a)
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        # Wait for reservation to start and verify
        # node state should not be resv-exclusive
        self.logger.info('Waiting 10s for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'},
                           id=resv_node, op=NE)

    def test_multijob_on_resv_exclusive_node(self):
        """
        Test multiple jobs request inside a reservation
        if none(node,reservation or job) asks for exclusivity
        """
        now = int(time.time())
        a = {'Resource_List.select': '1:ncpus=2:vntype=cray_compute',
             'Resource_List.place': 'shared',
             'reserve_start': now + 20,
             'reserve_end': now + 40}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.logger.info('Waiting for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        # NOTE(review): the reservation was placed 'shared' yet the node is
        # expected resv-exclusive here — confirm this matches Cray behavior.
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        a = {ATTR_q: rid_q}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node)
        j2 = Job(TEST_USER, attrs=a)
        j2.create_script(self.script)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid2)

    def test_job_with_exclusive_placement(self):
        """
        Job will honour exclusivity inside the reservation
        """
        now = int(time.time())
        a = {'Resource_List.select': '1:ncpus=2:vntype=cray_compute',
             'Resource_List.place': 'excl',
             'reserve_start': now + 20,
             'reserve_end': now + 40}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.logger.info('Waiting for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '1:ncpus=1',
             'Resource_List.place': 'excl'}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        # A shared job must stay queued while the exclusive job holds the
        # node, then run once jid1 is gone.
        a = {ATTR_q: rid_q, ATTR_l + '.select': '1:ncpus=1',
             'Resource_List.place': 'shared'}
        j2 = Job(TEST_USER, attrs=a)
        j2.create_script(self.script)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid2)
        self.server.expect(JOB, 'queue', op=UNSET, id=jid1, offset=5)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2)

    def test_job_running_on_multinode_reservation(self):
        """
        Test to submit job on multinode reservation with different
        placement
        """
        ncpus = []
        vnodes = self.server.status(NODE)
        # NOTE(review): num_vnodes and total_ncpus are computed but never
        # used below.
        num_vnodes = 2
        i = 0
        for vnode in vnodes:
            if i < 2:
                if vnode['resources_available.vntype'] == 'cray_compute':
                    ncpus.append(int(vnode['resources_available.ncpus']))
                    i += 1
            if i == 2:
                break
        total_ncpus = ncpus[0] + ncpus[1]
        # NOTE(review): '/' is float division; the '%d' formats below
        # truncate the value — '//' would make the intent explicit.
        req_ncpus = min(ncpus[0] / 2, ncpus[1] / 2)
        now = int(time.time())
        a = {
            'Resource_List.select': '2:ncpus=%d:vntype=cray_compute' % min(
                ncpus[0], ncpus[1]),
            'Resource_List.place': 'excl',
            'reserve_start': now + 20,
            'reserve_end': now + 60}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.logger.info('Waiting for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=20)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '2:ncpus=%d' % req_ncpus,
             'Resource_List.place': 'scatter'}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '1:ncpus=%d' % ncpus[0],
             'Resource_List.place': 'excl'}
        j2 = Job(TEST_USER, attrs=a)
        j2.create_script(self.script)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid2)
        a = {ATTR_q: rid_q, ATTR_l + '.select': '1:ncpus=%d' % ncpus[1],
             'Resource_List.place': 'shared'}
        j3 = Job(TEST_USER, attrs=a)
        j3.create_script(self.script)
        jid3 = self.server.submit(j3)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid3)
        # Once jid1 finishes, both queued jobs should be able to run.
        self.server.expect(JOB, 'queue', op=UNSET, id=jid1, offset=5)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid2)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid3)

    def test_job_with_exclhost_placement_inside_resv(self):
        """
        Job inside a reservation asking for place=exclhost on host
        will have all resources of the vnodes present on host assigned
        to it
        """
        now = int(time.time())
        a = {'Resource_List.select': '1:ncpus=2:vntype=cray_compute',
             'Resource_List.place': 'exclhost',
             'reserve_start': now + 20,
             'reserve_end': now + 40}
        rid = self.submit_and_confirm_resv(a)
        rid_q = rid.split('.')[0]
        self.server.status(RESV, 'resv_nodes', id=rid)
        resv_node = self.server.reservations[rid].get_vnodes()[0]
        self.logger.info('Waiting for reservation to start')
        a = {'reserve_state': (MATCH_RE, "RESV_RUNNING|5")}
        self.server.expect(RESV, a, id=rid, offset=10)
        self.server.expect(NODE, {'state': 'resv-exclusive'}, id=resv_node)
        a = {ATTR_q: rid_q}
        j1 = Job(TEST_USER, attrs=a)
        j1.create_script(self.script)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {'job_state': 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive,resv-exclusive'},
                           id=resv_node)
        a = {ATTR_q: rid_q}
        j2 = Job(TEST_USER, attrs=a)
        j2.create_script(self.script)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {'job_state': 'Q'}, id=jid2)
        self.server.expect(JOB, 'queue',
op=UNSET, id=jid1, offset=10) self.server.expect(RESV, 'queue', op=UNSET, id=rid, offset=10) self.server.expect(NODE, {'state': 'free'}, id=resv_node) ================================================ FILE: test/tests/functional/pbs_cray_hyperthread.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. 
from tests.functional import *
from ptl.utils.pbs_crayutils import CrayUtils
import os


@tags('cray')
class TestCrayHyperthread(TestFunctional):

    """
    The test will submit a job script that calls aprun with the option
    that will allow callers to use the hyperthreads on a hyperthreaded
    compute node.
    """

    def setUp(self):
        # Cray-only suite: skip before the base-class setup does any work.
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("Test suite only meant to run on a Cray")
        TestFunctional.setUp(self)

    def test_hyperthread(self):
        """
        Check for a compute node that has hyperthreads, if there is one
        submit a job to that node requesting the hyperthreads.
        Check there are no errors in the job error output.
        If there is no node with hyperthreads, skip the test.
        """
        # Get the compute nodes from PBS and see if they are threaded
        cu = CrayUtils()
        all_nodes = self.server.status(NODE)
        threaded = 0
        for n in all_nodes:
            if n['resources_available.vntype'] == 'cray_compute':
                numthreads = cu.get_numthreads(
                    n['resources_available.PBScraynid'])
                if numthreads > 1:
                    self.logger.info("Node %s has %s hyperthreads" %
                                     (n['resources_available.vnode'],
                                      numthreads))
                    # Remember the first hyperthreaded node; the job below
                    # is pinned to this vnode.
                    ncpus = n['resources_available.ncpus']
                    vnode = n['resources_available.vnode']
                    threaded = 1
                    break
        if not threaded:
            self.skipTest("Test suite needs nodes with hyperthreads")
        # There is a node with hyperthreads, get the number of cpus
        aprun_args = '-j %d -n %d' % (int(numthreads), int(ncpus))
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'job_history_enable': 'True'})
        j1 = Job(TEST_USER, {ATTR_l + '.select': '1:ncpus=%d:vnode=%s' %
                             (int(ncpus), vnode),
                             ATTR_N: 'hyperthread'})
        scr = []
        scr += ['hostname\n']
        scr += ['/bin/sleep 5\n']
        scr += ['aprun -b %s /bin/hostname\n' % aprun_args]
        sub_dir = self.du.create_temp_dir(asuser=TEST_USER)
        j1.create_script(scr)
        jid1 = self.server.submit(j1, submit_dir=sub_dir)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        # Verify the contents of the output/error files once the job has
        # finished (needs job_history_enable set above).
        self.server.expect(JOB, {'job_state': 'F'}, id=jid1, extend='x')
        error_file = os.path.join(
            sub_dir, 'hyperthread.e' + jid1.split('.')[0])
        self.assertEqual(os.stat(error_file).st_size, 0,
                         msg="Job error file should be empty")


================================================
FILE: test/tests/functional/pbs_cray_pagg_id.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.
from tests.functional import * @tags('cray') class TestCrayPaggIdUniqueness(TestFunctional): """ This test suite is written to verify that the PAGG ID provided to ALPS while confirming and releasing an ALPS reservation is not equal to the session ID of the job. This test is specific to Cray and will also not work on the Cray simulator, hence, will be skipped on non-Cray systems and Cray simulator. """ def setUp(self): platform = self.du.get_platform() if platform != 'cray': self.skipTest("not a cray") TestFunctional.setUp(self) def test_pagg_id(self): """ This test case submits a job, waits for it to run and then checks the MoM logs to confirm that the PAGG ID provided in the ALPS query is not equal to the session ID of the job. """ j1 = Job(TEST_USER) jid = self.server.submit(j1) self.server.expect(JOB, {ATTR_state: 'R'}, id=jid) self.mom.log_match("Job;%s;Started, pid" % (jid,), n=100, max_attempts=5, interval=5, regexp=True) self.server.status(JOB, [ATTR_session], jid) sess_id = j1.attributes[ATTR_session] msg = "pagg_id =\"" + sess_id + "\"" try: self.mom.log_match(msg, n='ALL') except PtlLogMatchError: self.logger.info("pagg_id is not equal to session id, test passes") else: self.assertFalse("pagg_id is equal to session id, test fails.") ================================================ FILE: test/tests/functional/pbs_cray_reliable_job_startup.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. 
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

import time
import fnmatch
from tests.functional import *
from ptl.utils.pbs_logutils import PBSLogUtils


@tags('cray')
class TestPbsReliableJobStartupOnCray(TestFunctional):

    """
    This tests the Reliable Job Startup Feature on Cray.
    A job can be started with extra nodes with node failures tolerated
    during job start but setting is not supported and ignored on Cray.
    """

    def setUp(self):
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("Test suite only meant to run on a Cray")
        TestFunctional.setUp(self)

        # queuejob hook: pads the select spec by one chunk per request and
        # asks for tolerate_node_failures="job_start" (ignored on Cray).
        self.qjob_hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "queuejob hook executed")
# Save current select spec in resource 'site'
e.job.Resource_List["site"] = str(e.job.Resource_List["select"])
new_select = e.job.Resource_List["select"].increment_chunks(1)
e.job.Resource_List["select"] = new_select
e.job.tolerate_node_failures = "job_start"
"""
        # prologue hook: logs the healthy/failed vnode lists and trims the
        # job back to its original ('site') select spec on the MS mom.
        self.prolo_hook_body = """
import pbs
e=pbs.event()
pbs.logmsg(pbs.LOG_DEBUG, "Executing prologue")
# print out the vnode_list[] values
for vn in e.vnode_list:
    v = e.vnode_list[vn]
    pbs.logjobmsg(e.job.id, "prologue: found vnode_list[" + v.name + "]")
# print out the vnode_list_fail[] values
for vn in e.vnode_list_fail:
    v = e.vnode_list_fail[vn]
    pbs.logjobmsg(e.job.id, "prologue: found vnode_list_fail[" + v.name + "]")
if e.job.in_ms_mom():
    pj = e.job.release_nodes(keep_select=e.job.Resource_List["site"])
    if pj is None:
        e.job.Hold_Types = pbs.hold_types("s")
        e.job.rerun()
        e.reject("unsuccessful at PROLOGUE")
"""
        # launch hook: same trimming at launch time; failed vnodes are
        # additionally marked offline.
        self.launch_hook_body = """
import pbs
e=pbs.event()
if 'PBS_NODEFILE' not in e.env:
    e.accept()
pbs.logmsg(pbs.LOG_DEBUG, "Executing launch")
# print out the vnode_list[] values
for vn in e.vnode_list:
    v = e.vnode_list[vn]
    pbs.logjobmsg(e.job.id, "launch: found vnode_list[" + v.name + "]")
# print out the vnode_list_fail[] values:
for vn in e.vnode_list_fail:
    v = e.vnode_list_fail[vn]
    pbs.logjobmsg(e.job.id, "launch: found vnode_list_fail[" + v.name + "]")
    v.state = pbs.ND_OFFLINE
if e.job.in_ms_mom():
    pj = e.job.release_nodes(keep_select=e.job.Resource_List["site"])
    if pj is None:
        e.job.Hold_Types = pbs.hold_types("s")
        e.job.rerun()
        e.reject("unsuccessful at LAUNCH")
"""

    def match_str_in_input_file(self, file_path, file_pattern, search_str):
        """
        Assert that search string appears in the input file that
        matches file_pattern
        """
        input_file = None
        for item in self.du.listdir(path=file_path, sudo=True):
            if fnmatch.fnmatch(item, file_pattern):
                input_file = item
                break
        self.assertTrue(input_file is not None)
        # Hook input files are root-owned; read via sudo.
        with PBSLogUtils().open_log(input_file, sudo=True) as f:
            self.assertTrue(search_str in f.read().decode())
        self.logger.info("Found \"%s\" in %s" % (search_str, input_file))

    @tags('cray')
    def test_reliable_job_startup_not_supported_on_cray(self):
        """
        A job is started with extra nodes. Mom superior will show no sign
        of tolerating node failure. Accounting logs won't have 's' record.
        Input files to prologue and launch hooks will show the
        tolerate_node_failures=none value.
        """
        # instantiate queuejob hook
        hook_event = 'queuejob'
        hook_name = 'qjob'
        a = {'event': hook_event, 'enabled': 'true'}
        self.server.create_import_hook(hook_name, a, self.qjob_hook_body)

        # instantiate execjob_prologue hook
        hook_event = 'execjob_prologue'
        hook_name = 'prolo'
        a = {'event': hook_event, 'enabled': 'true'}
        self.server.create_import_hook(hook_name, a, self.prolo_hook_body)

        # instantiate execjob_launch hook
        hook_event = 'execjob_launch'
        hook_name = 'launch'
        a = {'event': hook_event, 'enabled': 'true'}
        self.server.create_import_hook(hook_name, a, self.launch_hook_body)

        # Submit a job
        j = Job(TEST_USER, {ATTR_l + '.select': '1:ncpus=3:mem=2gb:vntype=' +
                            'cray_compute+1:ncpus=3:mem=2gb:vntype=' +
                            'cray_compute',
                            ATTR_l + '.place': 'scatter'})
        start_time = time.time()
        jid = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid)

        # Check for msg in mom superior logs
        msg = "no nodes released as job does not tolerate node failures"
        self.server.expect(JOB, 'exec_host', id=jid, op=SET)
        job_stat = self.server.status(JOB, id=jid)
        exechost = job_stat[0]['exec_host'].partition('/')[0]
        mom_superior = self.moms[exechost]
        mom_superior.log_match(msg, starttime=start_time)

        # Check that 's' record is absent since release_nodes() was not called
        self.server.accounting_match(
            msg=".*%s;%s;.*" % ('s', jid), regexp=True, n=50,
            max_attempts=10, existence=False)
        self.logger.info(
            "There was no 's' record found for job %s, test passes" % jid)

        # On mom superior check the input files to prologue and launch hooks
        # showed the tolerate_node_failures=none value
        search_str = 'pbs.event().job.tolerate_node_failures=none'
        self.mom_hooks_tmp_dir = os.path.join(
            self.server.pbs_conf['PBS_HOME'], 'mom_priv', 'hooks', 'tmp')
        hook_name = 'prolo'
        input_file_pattern = os.path.join(
            self.mom_hooks_tmp_dir,
            'hook_execjob_prologue_%s*.in' % hook_name)
        self.match_str_in_input_file(
            self.mom_hooks_tmp_dir, input_file_pattern, search_str)
        hook_name = 'launch'
        input_file_pattern = os.path.join(
            self.mom_hooks_tmp_dir,
            'hook_execjob_launch_%s*.in' % hook_name)
        self.match_str_in_input_file(
            self.mom_hooks_tmp_dir, input_file_pattern, search_str)


================================================
FILE: test/tests/functional/pbs_cray_smoketest.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

from tests.functional import *
from ptl.utils.pbs_crayutils import CrayUtils
import os


@tags('cray', 'smoke')
class TestCraySmokeTest(TestFunctional):

    """
    Set of tests that qualifies as smoketest for Cray platform
    """

    def setUp(self):
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("Test suite only meant to run on a Cray")
        TestFunctional.setUp(self)
        # no node in 'resv' and 'use' in apstat
        cu = CrayUtils()
        self.assertEqual(cu.count_node_summ('resv'), 0,
                         "No compute node should be having ALPS reservation")
        self.assertEqual(cu.count_node_summ('use'), 0,
                         "No compute node should be in use")
        # The number of compute nodes in State up and batch mode
        # (State = 'UP B') should equal the number of cray_compute nodes.
        nodes_up_b = cu.count_node_state('UP B')
        self.logger.info("Nodes with State 'UP B' : %s" % nodes_up_b)
        nodes_up_i = cu.count_node_state('UP I')
        self.logger.info("Nodes with State 'UP I' : %s" % nodes_up_i)
        nodes = self.server.filter(NODE,
                                   {ATTR_rescavail + '.vntype':
                                    'cray_compute'})
        num_cray_compute = len(nodes[ATTR_rescavail + '.vntype=cray_compute'])
        self.assertEqual(nodes_up_b, num_cray_compute)
        self.logger.info("nodes in State 'UP B': %s == cray_compute: %s" %
                         (nodes_up_b, num_cray_compute))
        # nodes are free and resources are available.
        nodes = self.server.status(NODE)
        for node in nodes:
            self.assertEqual(node['state'], 'free')
            self.assertEqual(node['resources_assigned.ncpus'], '0')
            self.assertEqual(node['resources_assigned.mem'], '0kb')

    @staticmethod
    def find_hw(output_file):
        """
        Find the string "Hello World" in the specified file.
        Return 1 if found.
        """
        found = 0
        with open(output_file, 'r') as outf:
            for line in outf:
                if "Hello World" in line:
                    found = 1
                    break
                else:
                    continue
        return found

    @tags('cray', 'smoke')
    def test_cray_login_job(self):
        """
        Submit a simple sleep job that requests to run on a login node
        and expect that job to go in running state on a login node.
        Verify that the job runs to completion and check job output/error.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'job_history_enable': 'True'})
        j1 = Job(TEST_USER, {ATTR_l + '.vntype': 'cray_login',
                             ATTR_N: 'cray_login'})
        scr = []
        scr += ['echo Hello World\n']
        scr += ['/bin/sleep 5\n']
        sub_dir = self.du.create_temp_dir(asuser=TEST_USER)
        j1.create_script(scr)
        jid1 = self.server.submit(j1, submit_dir=sub_dir)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        # fetch node name where the job is running and check that the
        # node is a login node
        self.server.status(JOB, 'exec_vnode', id=jid1)
        vname = j1.get_vnodes()[0]
        self.server.expect(NODE, {ATTR_rescavail + '.vntype': 'cray_login'},
                           id=vname, max_attempts=1)
        cu = CrayUtils()
        # Check if number of compute nodes in use are 0
        self.assertEqual(cu.count_node_summ('use'), 0)
        # verify the contents of output/error files
        self.server.expect(JOB, {'job_state': 'F'}, id=jid1, extend='x')
        error_file = os.path.join(sub_dir,
                                  'cray_login.e' + jid1.split('.')[0])
        self.assertEqual(os.stat(error_file).st_size, 0,
                         msg="Job error file should be empty")
        output_file = os.path.join(
            sub_dir, 'cray_login.o' + jid1.split('.')[0])
        foundhw = self.find_hw(output_file)
        self.assertEqual(foundhw, 1, msg="Job output file incorrect")

    @tags('cray', 'smoke')
    def test_cray_compute_job(self):
        """
        Submit a simple sleep job that runs on a compute node and
        expect the job to go in running state on a compute node.
        Verify that the job runs to completion and check job output/error.
        """
        self.server.manager(MGR_CMD_SET, SERVER,
                            {'job_history_enable': 'True'})
        j1 = Job(TEST_USER, {ATTR_l + '.vntype': 'cray_compute',
                             ATTR_N: 'cray_compute'})
        scr = []
        scr += ['echo Hello World\n']
        scr += ['/bin/sleep 5\n']
        scr += ['aprun -b -B /bin/sleep 10\n']
        sub_dir = self.du.create_temp_dir(asuser=TEST_USER)
        j1.create_script(scr)
        jid1 = self.server.submit(j1, submit_dir=sub_dir)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        # fetch node name where the job is running and check that the
        # node is a compute node
        self.server.status(JOB, 'exec_vnode', id=jid1)
        vname = j1.get_vnodes()[0]
        self.server.expect(NODE, {ATTR_rescavail + '.vntype':
                                  'cray_compute'}, id=vname)
        # Sleep for some time before aprun actually starts
        # using the reservation
        self.logger.info(
            "Sleeping 6 seconds before aprun starts using the reservation")
        time.sleep(6)
        cu = CrayUtils()
        # Check if number of compute nodes in use is 1
        self.assertEqual(cu.count_node_summ('resv'), 1)
        if self.du.get_platform() == 'cray':
            # Cray simulator will not show anything in 'use' because
            # aprun command is just a pass through on simulator
            self.assertEqual(cu.count_node_summ('use'), 1)
        # verify the contents of output/error files
        self.server.expect(JOB, {'job_state': 'F'}, id=jid1, extend='x')
        error_file = os.path.join(
            sub_dir, 'cray_compute.e' + jid1.split('.')[0])
        self.assertEqual(os.stat(error_file).st_size, 0,
                         msg="Job error file should be empty")
        output_file = os.path.join(
            sub_dir, 'cray_compute.o' + jid1.split('.')[0])
        foundhw = self.find_hw(output_file)
        self.assertEqual(foundhw, 1, msg="Job output file incorrect")
        # Re-read apstat and confirm the ALPS reservation was released.
        (cu.node_status, cu.node_summary) = cu.parse_apstat_rn()
        self.assertEqual(cu.count_node_summ('resv'), 0)
        if self.du.get_platform() == 'cray':
            self.assertEqual(cu.count_node_summ('use'), 0)


================================================
FILE: test/tests/functional/pbs_cray_suspend_resume.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair
# Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.

import time
from tests.functional import *
from ptl.utils.pbs_crayutils import CrayUtils


@tags('cray')
class TestSuspendResumeOnCray(TestFunctional):

    """
    Test special cases where suspend/resume functionality differs on cray
    as compared to other platforms.
    This test suite expects the platform to be 'cray' and assumes that
    suspend/resume feature is enabled on it.
    """
    # Shared Cray apstat/vnode helper for all tests in this suite.
    cu = CrayUtils()

    def setUp(self):
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("Test suite only meant to run on a Cray")
        TestFunctional.setUp(self)

    @tags('cray', 'smoke')
    def test_default_restrict_res_to_release_on_suspend_setting(self):
        """
        Check that on Cray restrict_res_to_release_on_suspend is always set
        to 'ncpus' by default
        """
        # Set restrict_res_to_release_on_suspend server attribute
        a = {ATTR_restrict_res_to_release_on_suspend: 'ncpus'}
        self.server.expect(SERVER, a)

    def test_exclusive_job_not_suspended(self):
        """
        If a running job is a job with exclusive placement then this job can
        not be suspended.
        This test is checking for a log message which is an unstable
        interface and may need change in future when interface changes.
        """
        msg_expected = "BASIL;ERROR: ALPS error: apsched: \
at least resid .* is exclusive"
        # Submit a job
        j = Job(TEST_USER, {ATTR_l + '.select': '1:ncpus=1',
                            ATTR_l + '.place': 'excl'})
        check_after = time.time()
        jid = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid)
        # suspend job; on Cray the ALPS reservation switch is expected to
        # fail for an exclusive-placement job.
        try:
            self.server.sigjob(jobid=jid, signal="suspend")
        except PbsSignalError as e:
            self.assertTrue("Switching ALPS reservation failed" in e.msg[0])
        self.server.expect(JOB, 'exec_host', id=jid, op=SET)
        job_stat = self.server.status(JOB, id=jid)
        s = self.mom.log_match(msg_expected, starttime=check_after,
                               regexp=True, max_attempts=10)
        self.assertTrue(s)

    @tags('cray')
    def test_basic_admin_suspend_restart(self):
        """
        Test basic admin-suspend functionality for jobs and array jobs with
        restart on Cray. The restart will test if the node recovers properly
        in maintenance. After turning off scheduling and a mom restart, a
        subjob is always requeued and node shows up as free.
        """
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        qstat = self.server.status(JOB, 'exec_vnode', id=jid1)
        vname = qstat[0]['exec_vnode'].partition(':')[0].strip('(')

        # admin-suspend regular job
        self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vname)
        self.server.expect(NODE, {'maintenance_jobs': jid1})

        # Server restart must preserve the maintenance state.
        self.server.restart()
        self.server.expect(NODE, {'state': 'maintenance'}, id=vname)
        self.server.expect(NODE, {'maintenance_jobs': jid1})

        # Adding sleep to avoid failure at resume since PBS licenses
        # might not be available and as a result resume fails
        time.sleep(2)

        # admin-resume regular job. Make sure the node returns to state
        # job-exclusive.
        self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive'}, id=vname)
        self.server.cleanup_jobs()

        # admin-suspend job array
        jA = Job(TEST_USER, {ATTR_l + '.select': '1:ncpus=1',
                             ATTR_J: '1-2'})
        jidA = self.server.submit(jA)
        self.server.expect(JOB, {ATTR_state: 'B'}, id=jidA)
        subjobs = self.server.status(JOB, id=jidA, extend='t')
        # subjobs[0] is the array itself. Need the subjobs
        jid1 = subjobs[1]['id']
        jid2 = subjobs[2]['id']
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2)
        qstat = self.server.status(JOB, 'exec_vnode', id=jid1)
        vname1 = qstat[0]['exec_vnode'].partition(':')[0].strip('(')
        qstat = self.server.status(JOB, 'exec_vnode', id=jid2)
        vname2 = qstat[0]['exec_vnode'].partition(':')[0].strip('(')

        # admin-suspend subjob 1
        self.server.sigjob(jid1, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid1)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vname1)
        self.server.expect(NODE, {'maintenance_jobs': jid1})

        # admin-resume subjob 1 . Make sure the node returns to state
        # job-exclusive.
        self.server.sigjob(jid1, 'admin-resume', runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.expect(NODE, {'state': 'job-exclusive'}, id=vname1)

        # admin-suspend subjob 2
        self.server.sigjob(jid2, 'admin-suspend', runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid2)
        self.server.expect(NODE, {'state': 'maintenance'}, id=vname2)
        self.server.expect(NODE, {'maintenance_jobs': jid2})

        # Turn off scheduling and restart mom
        self.server.manager(MGR_CMD_SET, SERVER, {'scheduling': 'False'})
        self.mom.restart()

        # Check that nodes are now free
        self.server.expect(NODE, {'state': 'free'}, id=vname1)
        self.server.expect(NODE, {'state': 'free'}, id=vname2)

    def test_admin_suspend_wrong_state(self):
        """
        Check that wrong 'resume' signal is correctly rejected.
        """
        j1 = Job(TEST_USER)
        jid1 = self.server.submit(j1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)
        self.server.sigjob(jid1, "suspend", runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid1)
        # A job suspended with "suspend" may not be resumed with
        # "admin-resume".
        try:
            self.server.sigjob(jid1, "admin-resume", runas=ROOT_USER)
        except PbsSignalError as e:
            self.assertTrue(
                'Job can not be resumed with the requested resume signal'
                in e.msg[0])
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid1)

        j2 = Job(TEST_USER)
        jid2 = self.server.submit(j2)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2)
        self.server.sigjob(jid2, "admin-suspend", runas=ROOT_USER)
        self.server.expect(JOB, {ATTR_state: 'S', ATTR_substate: 43},
                           id=jid2)
        # Conversely, an admin-suspended job may not be resumed with
        # "resume".
        try:
            self.server.sigjob(jid2, "resume", runas=ROOT_USER)
        except PbsSignalError as e:
            self.assertTrue(
                'Job can not be resumed with the requested resume signal'
                in e.msg[0])
        # The job should be in the same state as it was prior to the signal
        self.server.expect(JOB, {ATTR_state: 'S', ATTR_substate: 43},
                           id=jid2)

    def submit_resv(self, resv_start, chunks, resv_dur):
        """
        Function to request a PBS reservation with start time, chunks and
        duration as arguments.
        """
        a = {'Resource_List.select': '%d:ncpus=1:vntype=cray_compute'
             % chunks,
             'Resource_List.place': 'scatter',
             'reserve_start': int(resv_start),
             'reserve_duration': int(resv_dur)
             }
        r = Reservation(TEST_USER, attrs=a)
        rid = self.server.submit(r)
        try:
            a = {'reserve_state': (MATCH_RE, 'RESV_CONFIRMED|2')}
            d = self.server.expect(RESV, a, id=rid)
        except PtlExpectError as e:
            # Return the expect() result either way; the caller asserts it.
            d = e.rv
        return d

    @timeout(300)
    def test_preempt_STF(self):
        """
        Test shrink to fit by creating a reservation for all compute nodes
        starting in 100 sec. with a duration of two hours.
        A preempted STF job with min_walltime of 1 min. and max_walltime
        of 2 hours will stay suspended after higher priority job goes away
        if its min_walltime can't be satisfied.
        """
        qname = 'highp'
        a = {'queue_type': 'execution'}
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, qname)
        a = {'enabled': 'True', 'started': 'True', 'priority': '150'}
        self.server.manager(MGR_CMD_SET, QUEUE, a, qname)
        # Reserve all the compute nodes
        nv = self.cu.num_compute_vnodes(self.server)
        self.assertNotEqual(nv, 0, "There are no cray_compute vnodes "
                            "present.")
        now = time.time()
        resv_start = now + 100
        resv_dur = 7200
        d = self.submit_resv(resv_start, nv, resv_dur)
        self.assertTrue(d)
        j = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                            ATTR_l + '.place': 'scatter',
                            ATTR_l + '.min_walltime': '00:01:00',
                            ATTR_l + '.max_walltime': '02:00:00'})
        jid = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid)
        # The STF job must have been shrunk to fit before the reservation.
        self.server.expect(
            JOB, {ATTR_l + '.walltime': (LE, '00:01:40')}, id=jid)
        self.server.expect(
            JOB, {ATTR_l + '.walltime': (GE, '00:01:00')}, id=jid)
        # The sleep below will leave less than 1 minute window for jid
        # after j2id is deleted. The min_walltime of jid can't be
        # satisfied and jid will stay in S state.
        time.sleep(35)
        j2 = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                             ATTR_l + '.walltime': '00:01:00',
                             ATTR_l + '.place': 'scatter',
                             ATTR_q: 'highp'})
        j2id = self.server.submit(j2)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j2id)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid)
        # The sleep below will leave less than 1 minute window for jid
        time.sleep(50)
        self.server.delete(j2id)
        a = {'scheduling': 'True'}
        self.server.manager(MGR_CMD_SET, SERVER, a)
        self.server.expect(SERVER, {'server_state': 'Active'})
        self.server.expect(JOB, {ATTR_state: 'S'}, id=jid)

    def test_multi_express(self):
        """
        Test of multiple express queues of different priorities.
        See that jobs from the higher express queues preempt jobs from
        lower express queues.  Also see when express jobs finish (or are
        deleted), suspended jobs restart.
        Make sure loadLimit is set to 4 on the server node:
        # apmgr config loadLimit 4
        """
        _t = ('\"express_queue, normal_jobs, server_softlimits,' +
              ' queue_softlimits\"')
        a = {'preempt_prio': _t}
        self.scheduler.set_sched_config(a)
        a = {'queue_type': 'e', 'started': 'True',
             'enabled': 'True', 'Priority': 150}
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, "expressq")
        a['Priority'] = 160
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, "expressq2")
        a['Priority'] = 170
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, "expressq3")
        # Count the compute nodes
        nv = self.cu.num_compute_vnodes(self.server)
        self.assertNotEqual(nv, 0, "There are no cray_compute vnodes "
                            "present.")
        # Each successive job comes from a higher-priority express queue
        # and should preempt (suspend) the previous one.
        j1 = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                             ATTR_l + '.place': 'scatter',
                             ATTR_l + '.walltime': 3600})
        j1id = self.server.submit(j1)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j1id)
        j2 = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                             ATTR_l + '.place': 'scatter',
                             ATTR_l + '.walltime': 3600,
                             ATTR_q: 'expressq'})
        j2id = self.server.submit(j2)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=j1id)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j2id)
        j3 = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                             ATTR_l + '.place': 'scatter',
                             ATTR_l + '.walltime': 3600,
                             ATTR_q: 'expressq2'})
        j3id = self.server.submit(j3)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=j2id)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j3id)
        j4 = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                             ATTR_l + '.place': 'scatter',
                             ATTR_l + '.walltime': 3600,
                             ATTR_q: 'expressq3'})
        j4id = self.server.submit(j4)
        self.server.expect(JOB, {ATTR_state: 'S'}, id=j3id)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j4id)
        # Deleting the top job lets the next-highest resume.
        self.server.delete(j4id)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=j3id)

    def test_preempted_topjob_calendared(self):
        """
        That even if topjob_ineligible is set for a preempted job and
        sched_preempt_enforce_resumption is set true, the preempted job
        will be calendared
        """
        self.server.manager(MGR_CMD_SET, SCHED,
                            {'sched_preempt_enforce_resumption': 'true'})
        self.server.manager(MGR_CMD_SET, SERVER, {'backfill_depth': '2'})

        # Count the compute nodes
        nv = self.cu.num_compute_vnodes(self.server)
        self.assertNotEqual(nv, 0, "There are no cray_compute vnodes "
                            "present.")

        # Submit a job
        j = Job(TEST_USER, {ATTR_l + '.select': '%d:ncpus=1' % nv,
                            ATTR_l + '.place': 'scatter',
                            ATTR_l + '.walltime': '120'})
        jid1 = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1)

        # Alter topjob_ineligible for running job
        self.server.alterjob(jid1, {ATTR_W: "topjob_ineligible = true"},
                             runas=ROOT_USER, logerr=True)

        # Create a high priority queue
        a = {'queue_type': 'e', 'started': 't',
             'enabled': 'True', 'priority': '150'}
        self.server.manager(MGR_CMD_CREATE, QUEUE, a, id="highp")

        # Submit a job to high priority queue
        j = Job(TEST_USER, {ATTR_queue: 'highp',
                            ATTR_l + '.walltime': '60'})
        jid2 = self.server.submit(j)
        self.server.expect(JOB, {ATTR_state: 'R'}, id=jid2)

        # Verify that job1 is calendared
        self.server.expect(JOB, 'estimated.start_time',
                           op=SET, id=jid1)
        qstat = self.server.status(JOB, 'estimated.start_time',
                                   id=jid1)
        est_time = qstat[0]['estimated.start_time']
        self.assertNotEqual(est_time, None)
        self.scheduler.log_match(jid1 + ";Job is a top job",
                                 starttime=self.server.ctime,
                                 max_attempts=10)


================================================
FILE: test/tests/functional/pbs_cray_vnode_per_numa.py
================================================
# coding: utf-8
# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
# License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
#
# Commercial License Information:
#
# PBS Pro is commercially licensed software that shares a common core with
# the OpenPBS software. For a copy of the commercial license terms and
# conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
# Altair Legal Department.
#
# Altair's dual-license business model allows companies, individuals, and
# organizations to create proprietary derivative works of OpenPBS and
# distribute them - whether embedded or bundled with other software -
# under a commercial license agreement.
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.
from tests.functional import * @tags('cray', 'mom', 'configuration') class TestVnodePerNumaNode(TestFunctional): """ This test suite is for testing the new mom_priv configuration parameter, vnode_per_numa_node. Test that the information is correctly being compressed into one vnode using the default setting (equivalent to FALSE). """ def setUp(self): if not self.du.get_platform().startswith('cray'): self.skipTest("Test suite only meant to run on a Cray") TestFunctional.setUp(self) @tags('cray', 'smoke') def test_settings(self): """ vnode_per_numa_node is unset (defaults to FALSE). Set $vnode_per_numa_node to TRUE Sum up the ncpus, memory, and naccelerators for all vnodes that have the same host (i.e. NUMA nodes that belong to the same compute node). Unset $vnode_per_numa_node in mom_priv/config. Now for each host, compare the ncpus, mem, and naccelerators against the values we got when $vnode_per_numa_node was set to TRUE. They should be equal. Verify that PBS created only one vnode, and: - PBScrayseg attribute is not set - ncpus is a total from all NUMA nodes of that node - mem is a total from all NUMA nodes of that node - the naccelerators value is correct - the accelerator_memory value is correct Set $vnode_per_numa_node to FALSE. Compare the pbsnodes output when vnode_per_numa_node was unset versus when vnode_per_numa_node was set to False. 
""" dncpus = {} dmem = {} dacc = {} daccmem = {} # First we mimic old behavior by setting vnode_per_numa_node to TRUE # Do not HUP now, we will do so when we reset the nodes rv = self.mom.add_config({'$vnode_per_numa_node': True}, False) self.assertTrue(rv) # Start from a clean slate, delete any existing nodes and re-create # them momname = self.mom.shortname self.reset_nodes(momname) # Get the pbsnodes -av output for comparison later vnodes_pernuma = self.server.status(NODE) for n in vnodes_pernuma: if n['resources_available.host'] not in dncpus.keys(): dncpus[n['resources_available.host']] = int( n['resources_available.ncpus']) else: dncpus[n['resources_available.host'] ] += int(n['resources_available.ncpus']) if n['resources_available.host'] not in dmem.keys(): dmem[n['resources_available.host']] = int( n['resources_available.mem'][0:-2]) else: dmem[n['resources_available.host'] ] += int(n['resources_available.mem'][0:-2]) if 'resources_available.naccelerators' in n.keys(): if n['resources_available.naccelerators'][0] != '@': if n['resources_available.host'] not in dacc.keys(): dacc[n['resources_available.host']] = int( n['resources_available.naccelerators']) else: dacc[n['resources_available.host'] ] += int(n['resources_available.naccelerators']) if 'resources_available.accelerator_memory' in n.keys(): if n['resources_available.accelerator_memory'][0] != '@': if n['resources_available.host'] not in daccmem.keys(): daccmem[n['resources_available.host']] = int( n['resources_available.accelerator_memory'][0:-2]) else: daccmem[n['resources_available.host']] += int(n[ 'resources_available.accelerator_memory'][0:-2]) # Remove the configuration setting and re-read the vnodes rv = self.mom.unset_mom_config('$vnode_per_numa_node', False) self.assertTrue(rv) self.reset_nodes(momname) vnodes_combined = self.server.status(NODE) # Compare the multiple vnodes values to the combined vnode output for n in vnodes_combined: if 'resources_available.PBScrayseg' in n: 
self.logger.error( "ERROR resources_available.PBScrayseg was found.") self.assertTrue(False) self.assertEqual(int(n['resources_available.ncpus']), dncpus[ n['resources_available.host']]) self.assertEqual(int(n['resources_available.mem'][0:-2]), dmem[ n['resources_available.host']]) if 'resources_available.naccelerators' in n: self.assertEqual(int(n['resources_available.naccelerators']), dacc[n['resources_available.host']]) if 'resources_available.accelerator_memory' in n: self.assertEqual(int(n['resources_available.accelerator_memory' ][0:-2]), daccmem[n['resources_available.host']]) # Set vnode_per_numa_node to FALSE and re-read the vnodes rv = self.mom.add_config({'$vnode_per_numa_node': False}, False) self.assertTrue(rv) self.reset_nodes(momname) vnodes_combined1 = self.server.status(NODE) # Compare the pbsnodes output when vnode_per_numa_node was unset # versus when vnode_per_numa_node was set to False. # List of resources to be ignored while comparing. ignr_rsc = ['license', 'last_state_change_time'] len_vnodes_combined1 = len(vnodes_combined1) len_vnodes_combined = len(vnodes_combined) n = 0 if len_vnodes_combined == len_vnodes_combined1: self.logger.info( "pbsnodes outputs are equal in length") for vdict in vnodes_combined: for key in vdict: if key in ignr_rsc: continue if key in vnodes_combined1[n]: if vdict[key] != vnodes_combined1[n][key]: self.fail("ERROR vnode %s has " "differing element." % key) else: self.fail("ERROR vnode %s has " "differing element." % key) n += 1 else: self.fail("ERROR pbsnodes outputs differ in length.") def restartPBS(self): try: svcs = PBSInitServices() svcs.restart() except PbsInitServicesError as e: self.logger.error("PBS restart failed: \n" + e.msg) self.assertTrue(e.rv) def reset_nodes(self, hostA): """ Reset nodes. 
""" # Remove all nodes rv = self.server.manager(MGR_CMD_DELETE, NODE, None, "") self.assertEqual(rv, 0) # Restart PBS self.restartPBS() # Create node rv = self.server.manager(MGR_CMD_CREATE, NODE, None, hostA) self.assertEqual(rv, 0) # Wait for 3 seconds for changes to take effect time.sleep(3) ================================================ FILE: test/tests/functional/pbs_cray_vnode_pool.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. 
#
# Use of Altair's trademarks, including but not limited to "PBS™",
# "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
# subject to Altair's trademark licensing policies.


from tests.functional import *


@tags('cray', 'configuration')
class TestVnodePool(TestFunctional):
    """
    This test suite tests how PBS makes use of node attribute "vnode_pool"
    It expects at least 2 moms to be specified to it while executing.
    """

    def setUp(self):
        # vnode_pool is a Cray-only feature and needs two reporting moms.
        if not self.du.get_platform().startswith('cray'):
            self.skipTest("This test can only run on a cray")
        TestFunctional.setUp(self)
        if len(self.moms.values()) < 2:
            self.skipTest("Provide at least 2 moms while invoking test")
        # The moms provided to the test may have unwanted vnodedef files.
        if self.moms.values()[0].has_vnode_defs():
            self.moms.values()[0].delete_vnode_defs()
        if self.moms.values()[1].has_vnode_defs():
            self.moms.values()[1].delete_vnode_defs()
        # Check if vnodes exist before deleting nodes.
        # Clean all default nodes because each test case will set up nodes.
        try:
            self.server.status(NODE)
            self.server.manager(MGR_CMD_DELETE, NODE, None, "")
        except PbsStatusError as e:
            # An empty node list is fine; anything else is a real error.
            self.assertTrue("Server has no node list" in e.msg[0])

    def test_invalid_values(self):
        """
        Invalid vnode_pool values shall result in errors.
        """
        self.momA = self.moms.values()[0]
        self.momB = self.moms.values()[1]
        self.hostA = self.momA.shortname
        self.hostB = self.momB.shortname
        # Negative pool numbers must be rejected by qmgr.
        attr_A = {'vnode_pool': '-1'}
        try:
            self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA,
                                attrib=attr_A)
        except PbsManagerError as e:
            self.assertTrue("Illegal attribute or resource value" in e.msg[0])
        # Zero is likewise not a valid pool number.
        attr_A = {'vnode_pool': '0'}
        try:
            self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA,
                                attrib=attr_A)
        except PbsManagerError as e:
            self.assertTrue("Illegal attribute or resource value" in e.msg[0])
        # Non-numeric values must be rejected as well.
        attr_A = {'vnode_pool': 'a'}
        try:
            self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA,
                                attrib=attr_A)
        except PbsManagerError as e:
            self.assertTrue("Illegal attribute or resource value" in e.msg[0])

    def test_two_moms_single_vnode_pool(self):
        """
        Same vnode_pool for two moms shall result in one mom being the
        inventory mom and the other the non-inventory mom.
        The inventory mom goes down (e.g. killed).
        Compute nodes remain up even when the inventory mom is killed,
        since another mom is reporting them.
        Check that a new inventory mom is listed in the log.
        Bring up killed mom.
        """
        self.server.manager(MGR_CMD_SET, SERVER, {"log_events": -1})
        self.momA = self.moms.values()[0]
        self.momB = self.moms.values()[1]
        self.hostA = self.momA.shortname
        self.hostB = self.momB.shortname
        attr = {'vnode_pool': '1'}
        start_time = time.time()
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA, attrib=attr)
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostB, attrib=attr)
        self.server.log_match("Mom %s added to vnode_pool %s" %
                              (self.momB.hostname, '1'),
                              max_attempts=5, starttime=start_time)
        # The server greets the NON-inventory mom with this message, so
        # exactly one of the two mom logs should contain it.
        _msg = "Hello (no inventory required) from server"
        try:
            self.momA.log_match(_msg, max_attempts=9, starttime=start_time)
            found_in_momA = 1
        except PtlLogMatchError:
            found_in_momA = 0
        try:
            self.momB.log_match(_msg, max_attempts=9, starttime=start_time)
            found_in_momB = 1
        except PtlLogMatchError:
            found_in_momB = 0
        self.assertEqual(found_in_momA + found_in_momB, 1,
                         msg="an inventory mom not chosen correctly")
        # Only one mom is inventory mom
        if (found_in_momA == 0):
            inv_mom = self.momA
            noninv_mom = self.momB
        else:
            inv_mom = self.momB
            noninv_mom = self.momA
        self.logger.info("Inventory mom is %s." % inv_mom.shortname)
        self.logger.info("Non-inventory mom is %s." % noninv_mom.shortname)
        start_time = time.time()
        # Kill inventory mom
        inv_mom.signal('-KILL')
        # Check that former inventory mom is down
        rv = self.server.expect(
            VNODE, {'state': 'down'}, id=inv_mom.shortname,
            max_attempts=10, interval=2)
        self.assertTrue(rv)
        # Check if inventory mom changed and is listed in the server log.
        self.server.log_match(
            "Setting inventory_mom for vnode_pool %s to %s" %
            ('1', noninv_mom.shortname),
            max_attempts=5, starttime=start_time)
        self.logger.info(
            "Inventory mom is now %s in server logs."
            % (noninv_mom.shortname))
        # Check compute nodes are up
        vlist = []
        try:
            vnl = self.server.filter(
                VNODE, {'resources_available.vntype': 'cray_compute'})
            vlist = vnl["resources_available.vntype=cray_compute"]
        except Exception:
            # Best-effort: no compute vnodes means nothing to verify below.
            pass
        # Loop through each compute vnode in the list and check if state = free
        for v1 in vlist:
            # Check that the node is in free state
            rv = self.server.expect(
                VNODE, {'state': 'free'}, id=v1, max_attempts=3, interval=2)
            self.assertTrue(rv)
        # Start the previous inv mom.
        inv_mom.start()
        # Check previous inventory mom is up
        rv = self.server.expect(
            VNODE, {'state': 'free'}, id=inv_mom.shortname,
            max_attempts=3, interval=2)
        self.assertTrue(rv)

    def test_two_moms_different_vnode_pool(self):
        """
        Differing vnode_pool for two moms shall result in both moms
        reporting inventory.
        """
        self.momA = self.moms.values()[0]
        self.momB = self.moms.values()[1]
        self.hostA = self.momA.shortname
        self.hostB = self.momB.shortname
        attr_A = {'vnode_pool': '1'}
        attr_B = {'vnode_pool': '2'}
        start_time = time.time()
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA,
                            attrib=attr_A)
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostB,
                            attrib=attr_B)
        # Neither mom should get the "no inventory required" greeting,
        # since each pool needs its own inventory mom.
        _msg = "Hello (no inventory required) from server"
        try:
            self.momA.log_match(_msg, max_attempts=5, starttime=start_time)
            found_in_momA = 1
        except PtlLogMatchError:
            found_in_momA = 0
        try:
            self.momB.log_match(_msg, max_attempts=5, starttime=start_time)
            found_in_momB = 1
        except PtlLogMatchError:
            found_in_momB = 0
        self.assertTrue((found_in_momA + found_in_momB == 0),
                        msg="Both moms must report inventory")

    def test_invalid_usage(self):
        """
        Setting vnode_pool for an existing mom that does not have a
        vnode_pool attribute shall not be allowable.
        Setting vnode_pool for an existing mom having a vnode_pool
        attribute shall not be allowable.
        Unsetting vnode_pool for an existing mom having a vnode_pool
        attribute shall not be allowable.
        """
        self.momA = self.moms.values()[0]
        self.hostA = self.momA.shortname
        self.logger.info("hostA is %s."
                         % self.hostA)
        start_time = time.time()
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostA)
        # Setting vnode_pool on a node created without one must fail.
        attr_2 = {'vnode_pool': '2'}
        try:
            self.server.manager(
                MGR_CMD_SET, NODE, id=self.hostA, attrib=attr_2)
        except PbsManagerError as e:
            self.assertTrue("Invalid request" in e.msg[0])
        self.server.log_match("Unsupported actions for vnode_pool",
                              max_attempts=5, starttime=start_time)
        self.logger.info("Found correct server log message")
        self.momB = self.moms.values()[1]
        self.hostB = self.momB.shortname
        attr_1 = {'vnode_pool': '1'}
        start_time = time.time()
        self.server.manager(MGR_CMD_CREATE, NODE, id=self.hostB,
                            attrib=attr_1)
        # Changing an existing vnode_pool must fail too.
        attr_2 = {'vnode_pool': '2'}
        try:
            self.server.manager(MGR_CMD_SET, NODE, id=self.hostB,
                                attrib=attr_2)
        except PbsManagerError as e:
            self.assertTrue("Invalid request" in e.msg[0])
        self.server.log_match("Unsupported actions for vnode_pool",
                              max_attempts=5, starttime=start_time)
        # Unsetting vnode_pool must also be rejected.
        try:
            self.server.manager(MGR_CMD_UNSET, NODE, id=self.hostB,
                                attrib='vnode_pool')
        except PbsManagerError as e:
            self.assertTrue("Illegal value for node vnode_pool" in e.msg[0])


================================================
FILE: test/tests/functional/pbs_daemon_service_user.py
================================================
# coding: utf-8

# Copyright (C) 1994-2021 Altair Engineering, Inc.
# For more information, contact Altair at www.altair.com.
#
# This file is part of both the OpenPBS software ("OpenPBS")
# and the PBS Professional ("PBS Pro") software.
#
# Open Source License Information:
#
# OpenPBS is free software. You can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the
# Free Software Foundation, either version 3 of the License, or (at your
# option) any later version.
#
# OpenPBS is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Affero General Public
# License for more details.
# # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. import resource from tests.functional import * class TestDaemonServiceUser(TestFunctional): """ Test suite to test running schedulers as a non-root user """ def setUp(self): TestFunctional.setUp(self) def common_test(self, binary, runas, scheduser, msg, setup_sched=False): """ Test if running `binary` as `runas` with PBS_DAEMON_SERVICE_USER set as `scheduser` Check to see `msg` is in stderr If `msg` is None, make sure command passed """ if scheduser: self.du.set_pbs_config( self.server.hostname, confs={'PBS_DAEMON_SERVICE_USER': str(scheduser)} ) else: self.du.unset_pbs_config( self.server.hostname, confs='PBS_DAEMON_SERVICE_USER' ) self.server.restart() pbs_conf = self.du.parse_pbs_config(self.server.shortname) if setup_sched: sched_logs = os.path.join(pbs_conf['PBS_HOME'], 'sched_logs') sched_priv = os.path.join(pbs_conf['PBS_HOME'], 'sched_priv') self.du.chown(path=sched_logs, uid=scheduser, recursive=True, sudo=True, level=logging.INFO) self.du.chown(path=sched_priv, uid=scheduser, recursive=True, sudo=True, level=logging.INFO) binpath = os.path.join(pbs_conf['PBS_EXEC'], 'sbin', binary) ret = 
self.du.run_cmd(self.server.shortname, cmd=[binpath], runas=runas) if msg: self.assertEquals(ret['rc'], 1) self.assertIn(msg, '\n'.join(ret['err'])) else: self.assertEquals(ret['rc'], 0) self.assertFalse(ret['err']) def test_sched_runas_nonroot(self): """ Test if running sched as nonroot with PBS_DAEMON_SERVICE_USER set as another user """ self.common_test('pbs_sched', TEST_USER, TEST_USER1, 'Must be run by PBS_DAEMON_SERVICE_USER') def test_pbsfs_runas_nonroot(self): """ Test if running pbsfs as root with PBS_DAEMON_SERVICE_USER set as another user """ self.common_test('pbsfs', TEST_USER, TEST_USER1, 'Must be run by PBS_DAEMON_SERVICE_USER') def test_sched_runas_nonroot_notset(self): """ Test if running sched as nonroot with PBS_DAEMON_SERVICE_USER not set """ self.common_test('pbs_sched', TEST_USER, None, 'Must be run by PBS_DAEMON_SERVICE_USER if ' 'set or root if not set') def test_pbsfs_runas_nonroot_notset(self): """ Test if running pbsfs as nonroot with PBS_DAEMON_SERVICE_USER not set """ self.common_test('pbsfs', TEST_USER, None, 'Must be run by PBS_DAEMON_SERVICE_USER if ' 'set or root if not set') def test_sched_runas_nonroot_pass(self): """ Test if sched runs as non-root user """ self.scheduler.stop() self.common_test('pbs_sched', TEST_USER, TEST_USER, None, setup_sched=True) j = Job(TEST_USER1) jid = self.server.submit(j) self.server.expect(JOB, {'job_state': 'R'}, id=jid) ================================================ FILE: test/tests/functional/pbs_dup_acc_log_for_resv.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. 
You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. # # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * class TestDupAccLogForResv(TestFunctional): """ This test suite is for testing duplicate records in accounting log for start of reservations. 
""" def setUp(self): TestFunctional.setUp(self) def test_accounting_logs(self): r1 = Reservation(TEST_USER) a = {'Resource_List.select': '1:ncpus=1', 'reserve_start': int( time.time() + 5), 'reserve_end': int(time.time() + 60)} r1.set_attributes(a) r1id = self.server.submit(r1) time.sleep(8) self.server.restart() m = self.server.accounting_match( msg='.*B;' + r1id, id=r1id, n='ALL', allmatch=True, regexp=True) self.assertEqual(len(m), 1) ================================================ FILE: test/tests/functional/pbs_eligible_time.py ================================================ # coding: utf-8 # Copyright (C) 1994-2021 Altair Engineering, Inc. # For more information, contact Altair at www.altair.com. # # This file is part of both the OpenPBS software ("OpenPBS") # and the PBS Professional ("PBS Pro") software. # # Open Source License Information: # # OpenPBS is free software. You can redistribute it and/or modify it under # the terms of the GNU Affero General Public License as published by the # Free Software Foundation, either version 3 of the License, or (at your # option) any later version. # # OpenPBS is distributed in the hope that it will be useful, but WITHOUT # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public # License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see . # # Commercial License Information: # # PBS Pro is commercially licensed software that shares a common core with # the OpenPBS software. For a copy of the commercial license terms and # conditions, go to: (http://www.pbspro.com/agreement.html) or contact the # Altair Legal Department. 
# # Altair's dual-license business model allows companies, individuals, and # organizations to create proprietary derivative works of OpenPBS and # distribute them - whether embedded or bundled with other software - # under a commercial license agreement. # # Use of Altair's trademarks, including but not limited to "PBS™", # "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is # subject to Altair's trademark licensing policies. from tests.functional import * from ptl.utils.pbs_logutils import PBSLogUtils class TestEligibleTime(TestFunctional): """ Test suite for eligible time tests """ def setUp(self): TestFunctional.setUp(self) a = {'eligible_time_enable': 'True'} self.server.manager(MGR_CMD_SET, SERVER, a) self.accrue = {'ineligible': 1, 'eligible': 2, 'run': 3, 'exit': 4} def test_eligible_time_updated(self): """ Test that eligible time gets updated when a job is eligible """ a = {'resources_available.ncpus': 1} self.server.manager(MGR_CMD_SET, NODE, a, id=self.mom.shortname) self.server.manager(MGR_CMD_SET, SERVER, {"eligible_time_enable": "True"}) jid1 = self.server.submit(Job()) self.server.expect(JOB, {ATTR_state: 'R'}, id=jid1) jid2 = self.server.submit(Job()) a = {ATTR_state: 'Q', "accrue_type": "2"} self.server.expect(JOB, a, id=jid2) self.server.expect(JOB, {"eligible_time": "00:00:00"}, op=NE, id=jid2) def test_qsub_a(self): """ Test that jobs requsting qsub -a